20241028-07:24:13 argv ./main.py --nb_models=1 --gpus=1 --model=XL --batch_size=4 --eval_batch_size=4 --result_dir=results_culture_XL --learning_rate=2e-4 --accuracy_to_make_c_quizzes=0.99 20241028-07:24:13 args.log_filename train.log 20241028-07:24:13 args.result_dir results_culture_XL 20241028-07:24:13 args.seed 0 20241028-07:24:13 args.resume False 20241028-07:24:13 args.optimizer adam 20241028-07:24:13 args.nb_warmup_samples 5000 20241028-07:24:13 args.nb_epochs 10000 20241028-07:24:13 args.batch_size 4 20241028-07:24:13 args.train_batch_size None 20241028-07:24:13 args.eval_batch_size 4 20241028-07:24:13 args.nb_train_samples 50000 20241028-07:24:13 args.nb_test_samples 2500 20241028-07:24:13 args.nb_c_quizzes 5000 20241028-07:24:13 args.c_quiz_multiplier 1 20241028-07:24:13 args.learning_rate 0.0002 20241028-07:24:13 args.gradient_clipping None 20241028-07:24:13 args.nb_have_to_be_correct 3 20241028-07:24:13 args.nb_have_to_be_wrong 1 20241028-07:24:13 args.nb_mistakes_to_be_wrong 5 20241028-07:24:13 args.model_type standard 20241028-07:24:13 args.model XL 20241028-07:24:13 args.dim_model 1536 20241028-07:24:13 args.dim_keys 96 20241028-07:24:13 args.dim_hidden 4096 20241028-07:24:13 args.nb_heads 16 20241028-07:24:13 args.nb_blocks 32 20241028-07:24:13 args.dropout 0.5 20241028-07:24:13 args.nb_threads 1 20241028-07:24:13 args.gpus 1 20241028-07:24:13 args.nb_models 1 20241028-07:24:13 args.diffusion_nb_iterations 25 20241028-07:24:13 args.diffusion_proba_corruption 0.05 20241028-07:24:13 args.accuracy_to_make_c_quizzes 0.99 20241028-07:24:13 args.proba_prompt_noise 0.05 20241028-07:24:13 args.proba_hint 0.25 20241028-07:24:13 args.quizzes None 20241028-07:24:13 args.test None 20241028-07:24:13 args.grids_world_tasks replace_color,translate,grow,frame 20241028-07:24:24 main_device cuda:1 gpus ['cuda:1'] 20241028-07:24:24 vocabulary_size 11 20241028-07:24:27 nb_parameters 705070603 (705M) 20241028-07:24:27 wrote state.pth 20241028-07:24:27 --- epoch 0 ---------------------------------------- 20241028-07:24:27 current_test_accuracies 0.0000 20241028-07:24:27 no_c_quiz 20241028-07:24:27 weakest_accuracies [0.0] 20241028-07:24:40 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-07:58:24 train_loss 0 model 0 0.67235953125 20241028-07:58:24 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-07:58:46 test_loss 0 model 0 0.150032421875 20241028-07:58:46 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-07:59:08 test_accuracy 0 model 0 nb_correct 0 / 2500 (0.00%) 20241028-07:59:08 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-07:59:50 wrote ae_*.pth 20241028-07:59:50 epoch_duration 35min22s next_finish 08:35:12 20241028-07:59:50 wrote state.pth 20241028-07:59:50 --- epoch 1 ---------------------------------------- 20241028-07:59:50 current_test_accuracies 0.0000 20241028-07:59:50 no_c_quiz 20241028-07:59:50 weakest_accuracies [0.0] 20241028-07:59:50 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-08:34:48 train_loss 1 model 0 0.125338134765625 20241028-08:34:48 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-08:35:10 test_loss 1 model 0 0.0701385009765625 20241028-08:35:10 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-08:35:32 test_accuracy 1 model 0 nb_correct 752 / 2500 (30.08%) 20241028-08:35:32 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-08:36:16 wrote ae_*.pth 20241028-08:36:16 epoch_duration 36min26s next_finish 09:12:42 20241028-08:36:16 wrote state.pth 20241028-08:36:16 --- epoch 2 ---------------------------------------- 20241028-08:36:16 current_test_accuracies 0.3008 20241028-08:36:16 no_c_quiz 20241028-08:36:16 weakest_accuracies [0.3008] 20241028-08:36:16 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-09:11:14 train_loss 2 model 0 0.08541520874023438 20241028-09:11:14 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-09:11:36 test_loss 2 model 0 0.0533382080078125 20241028-09:11:36 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-09:11:58 test_accuracy 2 model 0 nb_correct 907 / 2500 (36.28%) 20241028-09:11:58 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-09:12:42 wrote ae_*.pth 20241028-09:12:42 epoch_duration 36min25s next_finish 09:49:08 20241028-09:12:42 wrote state.pth 20241028-09:12:42 --- epoch 3 ---------------------------------------- 20241028-09:12:42 current_test_accuracies 0.3628 20241028-09:12:42 no_c_quiz 20241028-09:12:42 weakest_accuracies [0.3628] 20241028-09:12:42 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-09:47:40 train_loss 3 model 0 0.07149109016418458 20241028-09:47:40 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-09:48:02 test_loss 3 model 0 0.04957075653076172 20241028-09:48:02 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-09:48:24 test_accuracy 3 model 0 nb_correct 1255 / 2500 (50.20%) 20241028-09:48:24 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-09:49:10 wrote ae_*.pth 20241028-09:49:10 epoch_duration 36min27s next_finish 10:25:38 20241028-09:49:10 wrote state.pth 20241028-09:49:10 --- epoch 4 ---------------------------------------- 20241028-09:49:10 current_test_accuracies 0.5020 20241028-09:49:10 no_c_quiz 20241028-09:49:10 weakest_accuracies [0.502] 20241028-09:49:10 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-10:24:08 train_loss 4 model 0 0.06334042610168457 20241028-10:24:08 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-10:24:30 test_loss 4 model 0 0.037710278511047364 20241028-10:24:30 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-10:24:52 test_accuracy 4 model 0 nb_correct 1381 / 2500 (55.24%) 20241028-10:24:52 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-10:25:35 wrote ae_*.pth 20241028-10:25:35 epoch_duration 36min25s next_finish 11:02:01 20241028-10:25:35 wrote state.pth 20241028-10:25:35 --- epoch 5 ---------------------------------------- 20241028-10:25:35 current_test_accuracies 0.5524 20241028-10:25:35 no_c_quiz 20241028-10:25:35 weakest_accuracies [0.5524] 20241028-10:25:35 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-11:00:33 train_loss 5 model 0 0.05667724517822265 20241028-11:00:33 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-11:00:55 test_loss 5 model 0 0.0348542049407959 20241028-11:00:55 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-11:01:17 test_accuracy 5 model 0 nb_correct 1496 / 2500 (59.84%) 20241028-11:01:17 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-11:02:02 wrote ae_*.pth 20241028-11:02:02 epoch_duration 36min26s next_finish 11:38:28 20241028-11:02:02 wrote state.pth 20241028-11:02:02 --- epoch 6 ---------------------------------------- 20241028-11:02:02 current_test_accuracies 0.5984 20241028-11:02:02 no_c_quiz 20241028-11:02:02 weakest_accuracies [0.5984] 20241028-11:02:02 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-11:37:01 train_loss 6 model 0 0.05102941383361816 20241028-11:37:01 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-11:37:23 test_loss 6 model 0 0.042854804706573484 20241028-11:37:23 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-11:37:45 test_accuracy 6 model 0 nb_correct 1806 / 2500 (72.24%) 20241028-11:37:45 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-11:38:27 wrote ae_*.pth 20241028-11:38:27 epoch_duration 36min24s next_finish 12:14:52 20241028-11:38:27 wrote state.pth 20241028-11:38:27 --- epoch 7 ---------------------------------------- 20241028-11:38:27 current_test_accuracies 0.7224 20241028-11:38:27 no_c_quiz 20241028-11:38:27 weakest_accuracies [0.7224] 20241028-11:38:27 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-12:13:25 train_loss 7 model 0 0.04699749176979065 20241028-12:13:25 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-12:13:47 test_loss 7 model 0 0.045373725891113284 20241028-12:13:47 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-12:14:09 test_accuracy 7 model 0 nb_correct 1849 / 2500 (73.96%) 20241028-12:14:09 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-12:14:53 wrote ae_*.pth 20241028-12:14:53 epoch_duration 36min25s next_finish 12:51:19 20241028-12:14:53 wrote state.pth 20241028-12:14:53 --- epoch 8 ---------------------------------------- 20241028-12:14:53 current_test_accuracies 0.7396 20241028-12:14:53 no_c_quiz 20241028-12:14:53 weakest_accuracies [0.7396] 20241028-12:14:53 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-12:49:51 train_loss 8 model 0 0.04347281683921814 20241028-12:49:51 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-12:50:13 test_loss 8 model 0 0.02562827293872833 20241028-12:50:13 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-12:50:35 test_accuracy 8 model 0 nb_correct 2080 / 2500 (83.20%) 20241028-12:50:35 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-12:51:16 wrote ae_*.pth 20241028-12:51:16 epoch_duration 36min23s next_finish 13:27:40 20241028-12:51:16 wrote state.pth 20241028-12:51:16 --- epoch 9 ---------------------------------------- 20241028-12:51:16 current_test_accuracies 0.8320 20241028-12:51:16 no_c_quiz 20241028-12:51:16 weakest_accuracies [0.832] 20241028-12:51:17 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-13:26:14 train_loss 9 model 0 0.040890128712654114 20241028-13:26:14 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-13:26:36 test_loss 9 model 0 0.03381906714439392 20241028-13:26:36 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-13:26:59 test_accuracy 9 model 0 nb_correct 2184 / 2500 (87.36%) 20241028-13:26:59 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-13:27:41 wrote ae_*.pth 20241028-13:27:41 epoch_duration 36min24s next_finish 14:04:05 20241028-13:27:41 wrote state.pth 20241028-13:27:41 --- epoch 10 ---------------------------------------- 20241028-13:27:41 current_test_accuracies 0.8736 20241028-13:27:41 no_c_quiz 20241028-13:27:41 weakest_accuracies [0.8736] 20241028-13:27:41 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-14:02:39 train_loss 10 model 0 0.03900787299871445 20241028-14:02:39 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-14:03:01 test_loss 10 model 0 0.02687938135266304 20241028-14:03:01 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-14:03:23 test_accuracy 10 model 0 nb_correct 2276 / 2500 (91.04%) 20241028-14:03:23 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-14:04:04 wrote ae_*.pth 20241028-14:04:04 epoch_duration 36min23s next_finish 14:40:27 20241028-14:04:04 wrote state.pth 20241028-14:04:04 --- epoch 11 ---------------------------------------- 20241028-14:04:04 current_test_accuracies 0.9104 20241028-14:04:04 no_c_quiz 20241028-14:04:04 weakest_accuracies [0.9104] 20241028-14:04:04 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-14:39:03 train_loss 11 model 0 0.03711862957239151 20241028-14:39:03 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-14:39:25 test_loss 11 model 0 0.03157089660167694 20241028-14:39:25 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-14:39:47 test_accuracy 11 model 0 nb_correct 2336 / 2500 (93.44%) 20241028-14:39:47 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-14:40:28 wrote ae_*.pth 20241028-14:40:28 epoch_duration 36min24s next_finish 15:16:53 20241028-14:40:28 wrote state.pth 20241028-14:40:28 --- epoch 12 ---------------------------------------- 20241028-14:40:28 current_test_accuracies 0.9344 20241028-14:40:28 no_c_quiz 20241028-14:40:28 weakest_accuracies [0.9344] 20241028-14:40:28 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-15:15:26 train_loss 12 model 0 0.03597815713644028 20241028-15:15:26 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-15:15:48 test_loss 12 model 0 0.029833321404457092 20241028-15:15:48 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-15:16:10 test_accuracy 12 model 0 nb_correct 2343 / 2500 (93.72%) 20241028-15:16:10 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-15:16:53 wrote ae_*.pth 20241028-15:16:53 epoch_duration 36min24s next_finish 15:53:17 20241028-15:16:53 wrote state.pth 20241028-15:16:53 --- epoch 13 ---------------------------------------- 20241028-15:16:53 current_test_accuracies 0.9372 20241028-15:16:53 no_c_quiz 20241028-15:16:53 weakest_accuracies [0.9372] 20241028-15:16:53 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-15:51:51 train_loss 13 model 0 0.034544429858922955 20241028-15:51:51 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-15:52:13 test_loss 13 model 0 0.032570691561698915 20241028-15:52:13 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-15:52:35 test_accuracy 13 model 0 nb_correct 2333 / 2500 (93.32%) 20241028-15:52:35 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-15:53:17 wrote ae_*.pth 20241028-15:53:17 epoch_duration 36min24s next_finish 16:29:41 20241028-15:53:17 wrote state.pth 20241028-15:53:17 --- epoch 14 ---------------------------------------- 20241028-15:53:17 current_test_accuracies 0.9332 20241028-15:53:17 no_c_quiz 20241028-15:53:17 weakest_accuracies [0.9332] 20241028-15:53:17 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-16:28:16 train_loss 14 model 0 0.033375559336543084 20241028-16:28:16 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-16:28:38 test_loss 14 model 0 0.024757436454296112 20241028-16:28:38 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-16:29:00 test_accuracy 14 model 0 nb_correct 2402 / 2500 (96.08%) 20241028-16:29:00 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-16:29:41 wrote ae_*.pth 20241028-16:29:41 epoch_duration 36min24s next_finish 17:06:06 20241028-16:29:41 wrote state.pth 20241028-16:29:41 --- epoch 15 ---------------------------------------- 20241028-16:29:41 current_test_accuracies 0.9608 20241028-16:29:41 no_c_quiz 20241028-16:29:41 weakest_accuracies [0.9608] 20241028-16:29:41 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-17:04:39 train_loss 15 model 0 0.03266740776628256 20241028-17:04:39 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-17:05:01 test_loss 15 model 0 0.02359001075029373 20241028-17:05:01 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-17:05:23 test_accuracy 15 model 0 nb_correct 2376 / 2500 (95.04%) 20241028-17:05:23 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-17:06:05 wrote ae_*.pth 20241028-17:06:05 epoch_duration 36min23s next_finish 17:42:28 20241028-17:06:05 wrote state.pth 20241028-17:06:05 --- epoch 16 ---------------------------------------- 20241028-17:06:05 current_test_accuracies 0.9504 20241028-17:06:05 no_c_quiz 20241028-17:06:05 weakest_accuracies [0.9504] 20241028-17:06:05 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-17:41:03 train_loss 16 model 0 0.03182626745939255 20241028-17:41:03 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-17:41:25 test_loss 16 model 0 0.02550815589427948 20241028-17:41:25 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-17:41:47 test_accuracy 16 model 0 nb_correct 2362 / 2500 (94.48%) 20241028-17:41:47 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-17:42:28 wrote ae_*.pth 20241028-17:42:28 epoch_duration 36min23s next_finish 18:18:52 20241028-17:42:28 wrote state.pth 20241028-17:42:28 --- epoch 17 ---------------------------------------- 20241028-17:42:28 current_test_accuracies 0.9448 20241028-17:42:28 no_c_quiz 20241028-17:42:28 weakest_accuracies [0.9448] 20241028-17:42:28 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-18:17:27 train_loss 17 model 0 0.03078445198625326 20241028-18:17:27 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-18:17:49 test_loss 17 model 0 0.028616854476928712 20241028-18:17:49 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-18:18:11 test_accuracy 17 model 0 nb_correct 2380 / 2500 (95.20%) 20241028-18:18:11 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-18:18:53 wrote ae_*.pth 20241028-18:18:53 epoch_duration 36min24s next_finish 18:55:17 20241028-18:18:53 wrote state.pth 20241028-18:18:53 --- epoch 18 ---------------------------------------- 20241028-18:18:53 current_test_accuracies 0.9520 20241028-18:18:53 no_c_quiz 20241028-18:18:53 weakest_accuracies [0.952] 20241028-18:18:53 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-18:53:51 train_loss 18 model 0 0.030339936298131944 20241028-18:53:51 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-18:54:13 test_loss 18 model 0 0.025002933663129806 20241028-18:54:13 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-18:54:35 test_accuracy 18 model 0 nb_correct 2410 / 2500 (96.40%) 20241028-18:54:35 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-18:55:16 wrote ae_*.pth 20241028-18:55:16 epoch_duration 36min22s next_finish 19:31:38 20241028-18:55:16 wrote state.pth 20241028-18:55:16 --- epoch 19 ---------------------------------------- 20241028-18:55:16 current_test_accuracies 0.9640 20241028-18:55:16 no_c_quiz 20241028-18:55:16 weakest_accuracies [0.964] 20241028-18:55:16 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-19:30:14 train_loss 19 model 0 0.030214839967489242 20241028-19:30:14 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-19:30:36 test_loss 19 model 0 0.026370139230042697 20241028-19:30:36 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-19:30:58 test_accuracy 19 model 0 nb_correct 2394 / 2500 (95.76%) 20241028-19:30:58 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-19:31:39 wrote ae_*.pth 20241028-19:31:39 epoch_duration 36min23s next_finish 20:08:02 20241028-19:31:39 wrote state.pth 20241028-19:31:39 --- epoch 20 ---------------------------------------- 20241028-19:31:39 current_test_accuracies 0.9576 20241028-19:31:39 no_c_quiz 20241028-19:31:39 weakest_accuracies [0.9576] 20241028-19:31:39 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-20:06:37 train_loss 20 model 0 0.029098679245710374 20241028-20:06:37 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-20:06:59 test_loss 20 model 0 0.020736786079406738 20241028-20:06:59 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-20:07:21 test_accuracy 20 model 0 nb_correct 2419 / 2500 (96.76%) 20241028-20:07:21 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-20:08:02 wrote ae_*.pth 20241028-20:08:02 epoch_duration 36min23s next_finish 20:44:25 20241028-20:08:02 wrote state.pth 20241028-20:08:02 --- epoch 21 ---------------------------------------- 20241028-20:08:02 current_test_accuracies 0.9676 20241028-20:08:02 no_c_quiz 20241028-20:08:02 weakest_accuracies [0.9676] 20241028-20:08:02 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-20:43:00 train_loss 21 model 0 0.028974518743157388 20241028-20:43:00 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-20:43:22 test_loss 21 model 0 0.024240348474681376 20241028-20:43:22 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-20:43:44 test_accuracy 21 model 0 nb_correct 2433 / 2500 (97.32%) 20241028-20:43:44 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-20:44:26 wrote ae_*.pth 20241028-20:44:26 epoch_duration 36min23s next_finish 21:20:50 20241028-20:44:26 wrote state.pth 20241028-20:44:26 --- epoch 22 ---------------------------------------- 20241028-20:44:26 current_test_accuracies 0.9732 20241028-20:44:26 no_c_quiz 20241028-20:44:26 weakest_accuracies [0.9732] 20241028-20:44:26 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-21:19:24 train_loss 22 model 0 0.027981189906299116 20241028-21:19:24 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-21:19:46 test_loss 22 model 0 0.021338434851169586 20241028-21:19:46 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-21:20:08 test_accuracy 22 model 0 nb_correct 2443 / 2500 (97.72%) 20241028-21:20:08 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-21:20:49 wrote ae_*.pth 20241028-21:20:49 epoch_duration 36min23s next_finish 21:57:13 20241028-21:20:49 wrote state.pth 20241028-21:20:49 --- epoch 23 ---------------------------------------- 20241028-21:20:49 current_test_accuracies 0.9772 20241028-21:20:49 no_c_quiz 20241028-21:20:49 weakest_accuracies [0.9772] 20241028-21:20:49 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-21:55:48 train_loss 23 model 0 0.027936550604701044 20241028-21:55:48 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-21:56:10 test_loss 23 model 0 0.025244058602303266 20241028-21:56:10 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-21:56:32 test_accuracy 23 model 0 nb_correct 2433 / 2500 (97.32%) 20241028-21:56:32 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-21:57:13 wrote ae_*.pth 20241028-21:57:13 epoch_duration 36min23s next_finish 22:33:36 20241028-21:57:13 wrote state.pth 20241028-21:57:13 --- epoch 24 ---------------------------------------- 20241028-21:57:13 current_test_accuracies 0.9732 20241028-21:57:13 no_c_quiz 20241028-21:57:13 weakest_accuracies [0.9732] 20241028-21:57:13 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-22:32:11 train_loss 24 model 0 0.027611496338099242 20241028-22:32:11 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-22:32:33 test_loss 24 model 0 0.026861053079366683 20241028-22:32:33 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-22:32:55 test_accuracy 24 model 0 nb_correct 2407 / 2500 (96.28%) 20241028-22:32:55 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-22:33:37 wrote ae_*.pth 20241028-22:33:37 epoch_duration 36min24s next_finish 23:10:02 20241028-22:33:37 wrote state.pth 20241028-22:33:37 --- epoch 25 ---------------------------------------- 20241028-22:33:37 current_test_accuracies 0.9628 20241028-22:33:37 no_c_quiz 20241028-22:33:37 weakest_accuracies [0.9628] 20241028-22:33:37 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-23:08:37 train_loss 25 model 0 0.027350280060768128 20241028-23:08:37 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-23:08:59 test_loss 25 model 0 0.019786274136602878 20241028-23:08:59 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-23:09:21 test_accuracy 25 model 0 nb_correct 2438 / 2500 (97.52%) 20241028-23:09:21 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-23:10:02 wrote ae_*.pth 20241028-23:10:02 epoch_duration 36min24s next_finish 23:46:27 20241028-23:10:02 wrote state.pth 20241028-23:10:02 --- epoch 26 ---------------------------------------- 20241028-23:10:02 current_test_accuracies 0.9752 20241028-23:10:02 no_c_quiz 20241028-23:10:02 weakest_accuracies [0.9752] 20241028-23:10:02 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241028-23:45:01 train_loss 26 model 0 0.027426436398625374 20241028-23:45:01 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-23:45:23 test_loss 26 model 0 0.02028329553902149 20241028-23:45:23 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241028-23:45:45 test_accuracy 26 model 0 nb_correct 2447 / 2500 (97.88%) 20241028-23:45:45 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241028-23:46:26 wrote ae_*.pth 20241028-23:46:26 epoch_duration 36min23s next_finish 00:22:50 20241028-23:46:26 wrote state.pth 20241028-23:46:26 --- epoch 27 ---------------------------------------- 20241028-23:46:26 current_test_accuracies 0.9788 20241028-23:46:26 no_c_quiz 20241028-23:46:26 weakest_accuracies [0.9788] 20241028-23:46:26 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-00:21:24 train_loss 27 model 0 0.026744506003707647 20241029-00:21:24 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-00:21:46 test_loss 27 model 0 0.018095414584875107 20241029-00:21:46 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-00:22:08 test_accuracy 27 model 0 nb_correct 2395 / 2500 (95.80%) 20241029-00:22:08 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-00:22:49 wrote ae_*.pth 20241029-00:22:49 epoch_duration 36min23s next_finish 00:59:13 20241029-00:22:49 wrote state.pth 20241029-00:22:49 --- epoch 28 ---------------------------------------- 20241029-00:22:49 current_test_accuracies 0.9580 20241029-00:22:49 no_c_quiz 20241029-00:22:49 weakest_accuracies [0.958] 20241029-00:22:49 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-00:57:47 train_loss 28 model 0 0.02715518419906497 20241029-00:57:47 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-00:58:09 test_loss 28 model 0 0.02104291911125183 20241029-00:58:09 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-00:58:31 test_accuracy 28 model 0 nb_correct 2438 / 2500 (97.52%) 20241029-00:58:31 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-00:59:13 wrote ae_*.pth 20241029-00:59:13 epoch_duration 36min23s next_finish 01:35:37 20241029-00:59:13 wrote state.pth 20241029-00:59:13 --- epoch 29 ---------------------------------------- 20241029-00:59:13 current_test_accuracies 0.9752 20241029-00:59:13 no_c_quiz 20241029-00:59:13 weakest_accuracies [0.9752] 20241029-00:59:13 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-01:34:11 train_loss 29 model 0 0.02582126382946968 20241029-01:34:11 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-01:34:33 test_loss 29 model 0 0.019512227084487677 20241029-01:34:33 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-01:34:55 test_accuracy 29 model 0 nb_correct 2459 / 2500 (98.36%) 20241029-01:34:55 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-01:35:36 wrote ae_*.pth 20241029-01:35:36 epoch_duration 36min22s next_finish 02:11:59 20241029-01:35:36 wrote state.pth 20241029-01:35:36 --- epoch 30 ---------------------------------------- 20241029-01:35:36 current_test_accuracies 0.9836 20241029-01:35:36 no_c_quiz 20241029-01:35:36 weakest_accuracies [0.9836] 20241029-01:35:36 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-02:10:35 train_loss 30 model 0 0.025737308361083268 20241029-02:10:35 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-02:10:57 test_loss 30 model 0 0.022195719835162164 20241029-02:10:57 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-02:11:19 test_accuracy 30 model 0 nb_correct 2454 / 2500 (98.16%) 20241029-02:11:19 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-02:12:00 wrote ae_*.pth 20241029-02:12:00 epoch_duration 36min23s next_finish 02:48:23 20241029-02:12:00 wrote state.pth 20241029-02:12:00 --- epoch 31 ---------------------------------------- 20241029-02:12:00 current_test_accuracies 0.9816 20241029-02:12:00 no_c_quiz 20241029-02:12:00 weakest_accuracies [0.9816] 20241029-02:12:00 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-02:46:58 train_loss 31 model 0 0.025875775410607458 20241029-02:46:58 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-02:47:20 test_loss 31 model 0 0.021579846171289684 20241029-02:47:20 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-02:47:42 test_accuracy 31 model 0 nb_correct 2449 / 2500 (97.96%) 20241029-02:47:42 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-02:48:22 wrote ae_*.pth 20241029-02:48:22 epoch_duration 36min22s next_finish 03:24:44 20241029-02:48:22 wrote state.pth 20241029-02:48:22 --- epoch 32 ---------------------------------------- 20241029-02:48:22 current_test_accuracies 0.9796 20241029-02:48:22 no_c_quiz 20241029-02:48:22 weakest_accuracies [0.9796] 20241029-02:48:22 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-03:23:20 train_loss 32 model 0 0.02577271026492119 20241029-03:23:20 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-03:23:42 test_loss 32 model 0 0.01774372440315783 20241029-03:23:42 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-03:24:04 test_accuracy 32 model 0 nb_correct 2436 / 2500 (97.44%) 20241029-03:24:04 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-03:24:45 wrote ae_*.pth 20241029-03:24:45 epoch_duration 36min23s next_finish 04:01:09 20241029-03:24:45 wrote state.pth 20241029-03:24:45 --- epoch 33 ---------------------------------------- 20241029-03:24:45 current_test_accuracies 0.9744 20241029-03:24:45 no_c_quiz 20241029-03:24:45 weakest_accuracies [0.9744] 20241029-03:24:46 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-03:59:44 train_loss 33 model 0 0.025309531951621174 20241029-03:59:44 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-04:00:06 test_loss 33 model 0 0.02059392285179347 20241029-04:00:06 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-04:00:28 test_accuracy 33 model 0 nb_correct 2436 / 2500 (97.44%) 20241029-04:00:28 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-04:01:08 wrote ae_*.pth 20241029-04:01:08 epoch_duration 36min22s next_finish 04:37:31 20241029-04:01:08 wrote state.pth 20241029-04:01:08 --- epoch 34 ---------------------------------------- 20241029-04:01:08 current_test_accuracies 0.9744 20241029-04:01:08 no_c_quiz 20241029-04:01:08 weakest_accuracies [0.9744] 20241029-04:01:08 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-04:36:07 train_loss 34 model 0 0.02563663623265922 20241029-04:36:07 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-04:36:28 test_loss 34 model 0 0.02229537423476577 20241029-04:36:28 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-04:36:51 test_accuracy 34 model 0 nb_correct 2473 / 2500 (98.92%) 20241029-04:36:51 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-04:37:32 wrote ae_*.pth 20241029-04:37:32 epoch_duration 36min23s next_finish 05:13:55 20241029-04:37:32 wrote state.pth 20241029-04:37:32 --- epoch 35 ---------------------------------------- 20241029-04:37:32 current_test_accuracies 0.9892 20241029-04:37:32 no_c_quiz 20241029-04:37:32 weakest_accuracies [0.9892] 20241029-04:37:32 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-05:12:30 train_loss 35 model 0 0.025089174215234815 20241029-05:12:30 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-05:12:52 test_loss 35 model 0 0.01754548028483987 20241029-05:12:52 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-05:13:14 test_accuracy 35 model 0 nb_correct 2451 / 2500 (98.04%) 20241029-05:13:14 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-05:13:56 wrote ae_*.pth 20241029-05:13:56 epoch_duration 36min24s next_finish 05:50:20 20241029-05:13:56 wrote state.pth 20241029-05:13:56 --- epoch 36 ---------------------------------------- 20241029-05:13:56 current_test_accuracies 0.9804 20241029-05:13:56 no_c_quiz 20241029-05:13:56 weakest_accuracies [0.9804] 20241029-05:13:56 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-05:48:54 train_loss 36 model 0 0.02449174146711826 20241029-05:48:54 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-05:49:16 test_loss 36 model 0 0.02697692085802555 20241029-05:49:16 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-05:49:38 test_accuracy 36 model 0 nb_correct 2430 / 2500 (97.20%) 20241029-05:49:38 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-05:50:21 wrote ae_*.pth 20241029-05:50:21 epoch_duration 36min24s next_finish 06:26:45 20241029-05:50:21 wrote state.pth 20241029-05:50:21 --- epoch 37 ---------------------------------------- 20241029-05:50:21 current_test_accuracies 0.9720 20241029-05:50:21 no_c_quiz 20241029-05:50:21 weakest_accuracies [0.972] 20241029-05:50:21 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-06:25:19 train_loss 37 model 0 0.024803437894508243 20241029-06:25:19 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-06:25:41 test_loss 37 model 0 0.02272323981821537 20241029-06:25:41 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-06:26:03 test_accuracy 37 model 0 nb_correct 2461 / 2500 (98.44%) 20241029-06:26:03 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-06:26:46 wrote ae_*.pth 20241029-06:26:46 epoch_duration 36min25s next_finish 07:03:11 20241029-06:26:46 wrote state.pth 20241029-06:26:46 --- epoch 38 ---------------------------------------- 20241029-06:26:46 current_test_accuracies 0.9844 20241029-06:26:46 no_c_quiz 20241029-06:26:46 weakest_accuracies [0.9844] 20241029-06:26:46 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-07:01:43 train_loss 38 model 0 0.024775377303287386 20241029-07:01:43 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-07:02:05 test_loss 38 model 0 0.023332971338927744 20241029-07:02:05 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-07:02:27 test_accuracy 38 model 0 nb_correct 2462 / 2500 (98.48%) 20241029-07:02:27 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-07:03:09 wrote ae_*.pth 20241029-07:03:09 epoch_duration 36min23s next_finish 07:39:32 20241029-07:03:09 wrote state.pth 20241029-07:03:09 --- epoch 39 ---------------------------------------- 20241029-07:03:09 current_test_accuracies 0.9848 20241029-07:03:09 no_c_quiz 20241029-07:03:09 weakest_accuracies [0.9848] 20241029-07:03:09 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-07:38:07 train_loss 39 model 0 0.024541010756343604 20241029-07:38:07 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-07:38:29 test_loss 39 model 0 0.020432739239186048 20241029-07:38:29 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-07:38:51 test_accuracy 39 model 0 nb_correct 2454 / 2500 (98.16%) 20241029-07:38:51 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-07:39:33 wrote ae_*.pth 20241029-07:39:33 epoch_duration 36min23s next_finish 08:15:56 20241029-07:39:33 wrote state.pth 20241029-07:39:33 --- epoch 40 ---------------------------------------- 20241029-07:39:33 current_test_accuracies 0.9816 20241029-07:39:33 no_c_quiz 20241029-07:39:33 weakest_accuracies [0.9816] 20241029-07:39:33 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-08:14:31 train_loss 40 model 0 0.024159517689570784 20241029-08:14:31 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-08:14:53 test_loss 40 model 0 0.01949647225923836 20241029-08:14:53 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-08:15:15 test_accuracy 40 model 0 nb_correct 2467 / 2500 (98.68%) 20241029-08:15:15 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-08:15:55 wrote ae_*.pth 20241029-08:15:55 epoch_duration 36min22s next_finish 08:52:18 20241029-08:15:55 wrote state.pth 20241029-08:15:55 --- epoch 41 ---------------------------------------- 20241029-08:15:55 current_test_accuracies 0.9868 20241029-08:15:55 no_c_quiz 20241029-08:15:55 weakest_accuracies [0.9868] 20241029-08:15:55 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-08:50:54 train_loss 41 model 0 0.02428929205417633 20241029-08:50:54 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-08:51:15 test_loss 41 model 0 0.01730190966054797 20241029-08:51:15 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-08:51:38 test_accuracy 41 model 0 nb_correct 2466 / 2500 (98.64%) 20241029-08:51:38 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-08:52:19 wrote ae_*.pth 20241029-08:52:19 epoch_duration 36min23s next_finish 09:28:43 20241029-08:52:19 wrote state.pth 20241029-08:52:19 --- epoch 42 ---------------------------------------- 20241029-08:52:19 current_test_accuracies 0.9864 20241029-08:52:19 no_c_quiz 20241029-08:52:19 weakest_accuracies [0.9864] 20241029-08:52:19 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-09:27:17 train_loss 42 model 0 0.023838982805497944 20241029-09:27:17 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-09:27:39 test_loss 42 model 0 0.021008705668151377 20241029-09:27:39 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-09:28:01 test_accuracy 42 model 0 nb_correct 2452 / 2500 (98.08%) 20241029-09:28:01 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-09:28:42 wrote ae_*.pth 20241029-09:28:42 epoch_duration 36min22s next_finish 10:05:05 20241029-09:28:42 wrote state.pth 20241029-09:28:42 --- epoch 43 ---------------------------------------- 20241029-09:28:42 current_test_accuracies 0.9808 20241029-09:28:42 no_c_quiz 20241029-09:28:42 weakest_accuracies [0.9808] 20241029-09:28:42 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-10:03:40 train_loss 43 model 0 0.023919531135484576 20241029-10:03:40 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-10:04:02 test_loss 43 model 0 0.01920623355396092 20241029-10:04:02 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-10:04:24 test_accuracy 43 model 0 nb_correct 2453 / 2500 (98.12%) 20241029-10:04:24 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-10:05:05 wrote ae_*.pth 20241029-10:05:05 epoch_duration 36min23s next_finish 10:41:28 20241029-10:05:05 wrote state.pth 20241029-10:05:05 --- epoch 44 ---------------------------------------- 20241029-10:05:05 current_test_accuracies 0.9812 20241029-10:05:05 no_c_quiz 20241029-10:05:05 weakest_accuracies [0.9812] 20241029-10:05:05 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-10:40:03 train_loss 44 model 0 0.024434394002631307 20241029-10:40:03 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-10:40:25 test_loss 44 model 0 0.01839964100494981 20241029-10:40:25 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-10:40:47 test_accuracy 44 model 0 nb_correct 2454 / 2500 (98.16%) 20241029-10:40:47 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-10:41:27 wrote ae_*.pth 20241029-10:41:27 epoch_duration 36min21s next_finish 11:17:49 20241029-10:41:27 wrote state.pth 20241029-10:41:27 --- epoch 45 ---------------------------------------- 20241029-10:41:27 current_test_accuracies 0.9816 20241029-10:41:27 no_c_quiz 20241029-10:41:27 weakest_accuracies [0.9816] 20241029-10:41:27 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-11:16:25 train_loss 45 model 0 0.02424537214126438 20241029-11:16:25 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-11:16:47 test_loss 45 model 0 0.020239756659418344 20241029-11:16:47 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-11:17:09 test_accuracy 45 model 0 nb_correct 2459 / 2500 (98.36%) 20241029-11:17:09 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-11:17:50 wrote ae_*.pth 20241029-11:17:50 epoch_duration 36min23s next_finish 11:54:14 20241029-11:17:50 wrote state.pth 20241029-11:17:50 --- epoch 46 ---------------------------------------- 20241029-11:17:50 current_test_accuracies 0.9836 20241029-11:17:50 no_c_quiz 20241029-11:17:50 weakest_accuracies [0.9836] 20241029-11:17:50 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-11:52:49 train_loss 46 model 0 0.024164685086347164 20241029-11:52:49 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-11:53:11 test_loss 46 model 0 0.016819394004298376 20241029-11:53:11 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-11:53:33 test_accuracy 46 model 0 nb_correct 2466 / 2500 (98.64%) 20241029-11:53:33 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-11:54:14 wrote ae_*.pth 20241029-11:54:14 epoch_duration 36min23s next_finish 12:30:37 20241029-11:54:14 wrote state.pth 20241029-11:54:14 --- epoch 47 ---------------------------------------- 20241029-11:54:14 current_test_accuracies 0.9864 20241029-11:54:14 no_c_quiz 20241029-11:54:14 weakest_accuracies [0.9864] 20241029-11:54:14 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-12:29:12 train_loss 47 model 0 0.02398436620980501 20241029-12:29:12 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-12:29:34 test_loss 47 model 0 0.024748345467448234 20241029-12:29:34 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-12:29:56 test_accuracy 47 model 0 nb_correct 2465 / 2500 (98.60%) 20241029-12:29:56 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-12:30:38 wrote ae_*.pth 20241029-12:30:38 epoch_duration 36min23s next_finish 13:07:02 20241029-12:30:38 wrote state.pth 20241029-12:30:38 --- epoch 48 ---------------------------------------- 20241029-12:30:38 current_test_accuracies 0.9860 20241029-12:30:38 no_c_quiz 20241029-12:30:38 weakest_accuracies [0.986] 20241029-12:30:38 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-13:05:36 train_loss 48 model 0 0.024450543616861106 20241029-13:05:36 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-13:05:58 test_loss 48 model 0 0.022123433448467403 20241029-13:05:58 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-13:06:20 test_accuracy 48 model 0 nb_correct 2456 / 2500 (98.24%) 20241029-13:06:20 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-13:07:01 wrote ae_*.pth 20241029-13:07:01 epoch_duration 36min23s next_finish 13:43:25 20241029-13:07:01 wrote state.pth 20241029-13:07:01 --- epoch 49 ---------------------------------------- 20241029-13:07:01 current_test_accuracies 0.9824 20241029-13:07:01 no_c_quiz 20241029-13:07:01 weakest_accuracies [0.9824] 20241029-13:07:01 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-13:41:59 train_loss 49 model 0 0.023388983907401562 20241029-13:41:59 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-13:42:21 test_loss 49 model 0 0.016699708539247512 20241029-13:42:21 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-13:42:43 test_accuracy 49 model 0 nb_correct 2461 / 2500 (98.44%) 20241029-13:42:43 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-13:43:24 wrote ae_*.pth 20241029-13:43:24 epoch_duration 36min23s next_finish 14:19:48 20241029-13:43:24 wrote state.pth 20241029-13:43:24 --- epoch 50 ---------------------------------------- 20241029-13:43:24 current_test_accuracies 0.9844 20241029-13:43:24 no_c_quiz 20241029-13:43:24 weakest_accuracies [0.9844] 20241029-13:43:24 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-14:18:23 train_loss 50 model 0 0.02343058091722429 20241029-14:18:23 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-14:18:45 test_loss 50 model 0 0.026390923806000503 20241029-14:18:45 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-14:19:07 test_accuracy 50 model 0 nb_correct 2467 / 2500 (98.68%) 20241029-14:19:07 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-14:19:48 wrote ae_*.pth 20241029-14:19:48 epoch_duration 36min23s next_finish 14:56:12 20241029-14:19:48 wrote state.pth 20241029-14:19:48 --- epoch 51 ---------------------------------------- 20241029-14:19:48 current_test_accuracies 0.9868 20241029-14:19:48 no_c_quiz 20241029-14:19:48 weakest_accuracies [0.9868] 20241029-14:19:48 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-14:54:46 train_loss 51 model 0 0.023969386631716043 20241029-14:54:46 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-14:55:08 test_loss 51 model 0 0.017592001776397227 20241029-14:55:08 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-14:55:30 test_accuracy 51 model 0 nb_correct 2449 / 2500 (97.96%) 20241029-14:55:30 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-14:56:12 wrote ae_*.pth 20241029-14:56:12 epoch_duration 36min23s next_finish 15:32:36 20241029-14:56:12 wrote state.pth 20241029-14:56:12 --- epoch 52 ---------------------------------------- 20241029-14:56:12 current_test_accuracies 0.9796 20241029-14:56:12 no_c_quiz 20241029-14:56:12 weakest_accuracies [0.9796] 20241029-14:56:12 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-15:31:09 train_loss 52 model 0 0.023756297306232153 20241029-15:31:09 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-15:31:31 test_loss 52 model 0 0.01856003186516464 20241029-15:31:31 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-15:31:53 test_accuracy 52 model 0 nb_correct 2465 / 2500 (98.60%) 20241029-15:31:53 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-15:32:34 wrote ae_*.pth 20241029-15:32:34 epoch_duration 36min22s next_finish 16:08:57 20241029-15:32:34 wrote state.pth 20241029-15:32:34 --- epoch 53 ---------------------------------------- 20241029-15:32:34 current_test_accuracies 0.9860 20241029-15:32:34 no_c_quiz 20241029-15:32:34 weakest_accuracies [0.986] 20241029-15:32:34 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-16:07:33 train_loss 53 model 0 0.023055713625419885 20241029-16:07:33 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-16:07:55 test_loss 53 model 0 0.01808455322794616 20241029-16:07:55 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-16:08:17 test_accuracy 53 model 0 nb_correct 2454 / 2500 (98.16%) 20241029-16:08:17 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-16:08:58 wrote ae_*.pth 20241029-16:08:58 epoch_duration 36min23s next_finish 16:45:21 20241029-16:08:58 wrote state.pth 20241029-16:08:58 --- epoch 54 ---------------------------------------- 20241029-16:08:58 current_test_accuracies 0.9816 20241029-16:08:58 no_c_quiz 20241029-16:08:58 weakest_accuracies [0.9816] 20241029-16:08:58 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-16:43:55 train_loss 54 model 0 0.02318080147534609 20241029-16:43:55 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-16:44:17 test_loss 54 model 0 0.017535675332229585 20241029-16:44:17 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-16:44:39 test_accuracy 54 model 0 nb_correct 2461 / 2500 (98.44%) 20241029-16:44:39 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-16:45:20 wrote ae_*.pth 20241029-16:45:20 epoch_duration 36min21s next_finish 17:21:41 20241029-16:45:20 wrote state.pth 20241029-16:45:20 --- epoch 55 ---------------------------------------- 20241029-16:45:20 current_test_accuracies 0.9844 20241029-16:45:20 no_c_quiz 20241029-16:45:20 weakest_accuracies [0.9844] 20241029-16:45:20 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0 20241029-17:20:18 train_loss 55 model 0 0.023381758998781442 20241029-17:20:18 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-17:20:40 test_loss 55 model 0 0.02016963384952396 20241029-17:20:40 quiz_set nb_w_quizzes 2500 nb_c_quizzes 0 20241029-17:21:02 test_accuracy 55 model 0 nb_correct 2457 / 2500 (98.28%) 20241029-17:21:02 quiz_set nb_w_quizzes 150 nb_c_quizzes 0 20241029-17:21:42 wrote ae_*.pth 20241029-17:21:42 epoch_duration 36min22s next_finish 17:58:05 20241029-17:21:42 wrote state.pth 20241029-17:21:42 --- epoch 56 ---------------------------------------- 20241029-17:21:42 current_test_accuracies 0.9828 20241029-17:21:42 no_c_quiz 20241029-17:21:42 weakest_accuracies [0.9828] 20241029-17:21:42 quiz_set nb_w_quizzes 50000 nb_c_quizzes 0