# Settings for the clustering step.
# NOTE(review): the comments below are inferred from key names only; confirm
# against the code that consumes this file.
clustering:
  # CSV file read as input.
  input_csv: 'data/vanilla_1000/vanilla_1000.csv'
  # CSV file written with the clustered result.
  output_csv: 'data/clustering/vanilla_300_clustered.csv'
  # CSV file written with the cluster mapping.
  cluster_map_csv: 'data/clustering/vanilla_300_cluster_map.csv'
  # Presumably the target number of clusters; kept as an integer.
  k: 300

# Settings for the embedding step.
# NOTE(review): the comments below are inferred from key names only; confirm
# against the code that consumes this file.
embedding:
  # Identifier of the embedding model to request.
  model: 'text-embedding-3-large'
  # Presumably the number of inputs sent per embedding request; integer.
  batch_size: 50
  # JSON file presumably used to cache computed embeddings between runs.
  cache_path: 'data/clustering/vanilla_embedding_cache.json'