# Run-size settings.
# NOTE(review): the meaning of each key is inferred from its name only; the
# consuming code is not visible from this file — confirm before relying on it.
batch_size: 3072
num_iterations: 500
# Equals the number of prompts listed in clip_descriptors_text (2) —
# presumably the two must be kept in sync; verify against the loader.
num_descriptors: 2
num_centroids: 40000

# Descriptor and scorer selection, plus the seed value.
# Both types are set to "clip"; the clip_* keys elsewhere in this file
# presumably configure them — TODO confirm against the consuming code.
descriptor_type: clip
scorer_type: clip
num_flip: 1
num_category: 512
seed: 0

# Initialisation and crossover settings.
# Booleans and floats are written canonically (true / 0.0) so every YAML
# parser and linter reads them the same way.
init_random: true
# The proportion and k_points are both zero here — presumably this disables
# crossover entirely; TODO confirm against the consuming code.
crossover_proportion: 0.0
crossover_type: k_points
k_points: 0

# Logging and plotting settings.
# NOTE(review): the unit of the two frequencies (presumably iterations) is not
# stated in this file — confirm against the consuming code.
log_freq: 10
log_image_freq: 100
num_plot_centroids_per_ax: [7, 7]

# VQ-VAE architecture
# NOTE(review): latent_map_size is presumably the spatial size of the latent
# grid — confirm against the model code.
num_hiddens: 128
num_residual_hiddens: 64
num_residual_layers: 2
latent_map_size: [8, 8]

# CLIP text prompts, one per list entry.
clip_descriptors_text:
  - 'a red truck'
  - 'a blue truck'
clip_scoring_text:
  - 'a truck'
# NOTE(review): presumably [min, max] bounds applied to the CLIP descriptor
# values — confirm against the consuming code.
clip_descriptors_range: [2.7, 6.5]

# Dataset parameters
# NOTE(review): presumably [height, width, channels] — confirm the axis order
# against the data loader.
image_size: [128, 128, 3]
