type = str, default = 'train.log')
parser.add_argument('--download',
- type = bool, default = False)
+ action='store_true', default = False)
parser.add_argument('--seed',
type = int, default = 0)
type = float, default = 0.1)
parser.add_argument('--synthesis_sampling',
- type = bool, default = True)
+ action='store_true', default = True)
parser.add_argument('--checkpoint_name',
type = str, default = 'checkpoint.pth')
+parser.add_argument('--picoclvr_many_colors',
+ action='store_true', default = False)
+
######################################################################
args = parser.parse_args()
elif args.data == 'mnist':
task = TaskMNIST(batch_size = args.batch_size, device = device)
elif args.data == 'picoclvr':
- task = TaskPicoCLVR(batch_size = args.batch_size, device = device)
+ task = TaskPicoCLVR(batch_size = args.batch_size, many_colors = args.picoclvr_many_colors, device = device)
else:
raise ValueError(f'Unknown dataset {args.data}.')
######################################################################
+def all_properties(height, width, nb_squares, square_i, square_j, square_c):
+ s = [ ]
+
+ for r, c in [ (k, color_names[square_c[k]]) for k in range(nb_squares) ]:
+ s += [ f'there is {c}' ]
+
+ if square_i[r] >= height - height//3: s += [ f'{c} bottom' ]
+ if square_i[r] < height//3: s += [ f'{c} top' ]
+ if square_j[r] >= width - width//3: s += [ f'{c} right' ]
+ if square_j[r] < width//3: s += [ f'{c} left' ]
+
+ for t, d in [ (k, color_names[square_c[k]]) for k in range(nb_squares) ]:
+ if square_i[r] > square_i[t]: s += [ f'{c} below {d}' ]
+ if square_i[r] < square_i[t]: s += [ f'{c} above {d}' ]
+ if square_j[r] > square_j[t]: s += [ f'{c} right of {d}' ]
+ if square_j[r] < square_j[t]: s += [ f'{c} left of {d}' ]
+
+ return s
+
def generate(nb, height = 6, width = 8,
max_nb_squares = 5, max_nb_statements = 10,
many_colors = False):
# generates all the true relations
- s = [ ]
-
- for r, c in [ (k, color_names[square_c[k]]) for k in range(nb_squares) ]:
- s += [ f'there is {c}' ]
-
- if square_i[r] >= height - height//3: s += [ f'{c} bottom' ]
- if square_i[r] < height//3: s += [ f'{c} top' ]
- if square_j[r] >= width - width//3: s += [ f'{c} right' ]
- if square_j[r] < width//3: s += [ f'{c} left' ]
-
- for t, d in [ (k, color_names[square_c[k]]) for k in range(nb_squares) ]:
- if square_i[r] > square_i[t]: s += [ f'{c} below {d}' ]
- if square_i[r] < square_i[t]: s += [ f'{c} above {d}' ]
- if square_j[r] > square_j[t]: s += [ f'{c} right of {d}' ]
- if square_j[r] < square_j[t]: s += [ f'{c} left of {d}' ]
+ s = all_properties(height, width, nb_squares, square_i, square_j, square_c)
# pick at most max_nb_statements at random