# Run sizing: batch size, iteration count, and descriptor / centroid counts.
# NOTE(review): num_descriptors (2) equals the number of prompts listed in
# clip_descriptors_text -- presumably the two must stay in sync; confirm.
batch_size: 560
num_iterations: 500
num_descriptors: 2
num_centroids: 40000

# Descriptor and scorer selection (both set to `clip`), followed by the
# step / category counts, the RNG seed, and the random-initialisation flag.
descriptor_type: clip
scorer_type: clip
num_steps: 0
num_category: 512
seed: 0
# Canonical lowercase boolean: `True` is only recognised as a boolean by
# YAML 1.1 / 1.2-core parsers, whereas `true` is a boolean in every schema.
init_random: true

# Logging and plotting cadence.
# NOTE(review): the *_freq values are presumably counted in iterations, and
# num_plot_centroids_per_ax looks like a per-axis grid size; confirm both.
log_freq: 10
log_image_freq: 100
num_plot_centroids_per_ax: [7, 7]

# GDP-ME parameters
# Float written with an explicit fractional digit (same value as `100.`).
sigma_diag: 100.0

# VQ-VAE architecture
num_hiddens: 128
num_residual_hiddens: 64
num_residual_layers: 2
latent_map_size: [8, 8]

# CLIP text prompts: the descriptor prompts, the scoring prompt, and a
# numeric range associated with the descriptors.
# NOTE(review): clip_descriptors_range looks like [min, max] bounds applied to
# the descriptor values; confirm against the consuming code.
clip_descriptors_text: ["a red truck", "a blue truck"]
clip_scoring_text: ["a truck"]
clip_descriptors_range: [2.7, 6.5]

# Dataset parameters
# NOTE(review): presumably [height, width, channels]; confirm axis order.
image_size: [128, 128, 3]
