# Set-up entries: two `setenv` directives plus a GIT_ID record.
__technical:
  # Point HF_HOME at the current directory.
  - ${!setenv HF_HOME .}
  # Give SAMPLE_TEMPERATURE its default (1.) once, here, so that the later
  # `${!getenv SAMPLE_TEMPERATURE}` lookups do not have to repeat a default.
  - ${!setenv SAMPLE_TEMPERATURE ${!getenv SAMPLE_TEMPERATURE 1.}}
  # NOTE(review): presumably resolves to the current git commit id - confirm.
  - GIT_ID: ${!gitid}
# Model-specific options. Presumably the `switch` directive selects the child
# whose name matches USE_MODEL_SHORT - confirm against the config loader.
_pb._skp.${-model_options switch USE_MODEL_SHORT}:
  phi35_vi:
    # Model repository; overridable through USE_MODEL_REPO.
    model_id: ${!getenv USE_MODEL_REPO microsoft/Phi-3.5-vision-instruct}
    model_kwargs:
      trust_remote_code: True
    tokenizer_kwargs:
      trust_remote_code: True
      # num_crops may also be set to 16; the reason is unclear because the
      # upstream documentation is sparse.
      num_crops: 4
    # Dataset-specific options for this model. Presumably the child matching
    # DATASET_ID is selected - confirm against the config loader.
    _pb._skp.${-model_options switch DATASET_ID}:
      SPAR:
        messages:
          - role: user
            # Double-quoted on purpose: in a single-quoted YAML scalar `\n`
            # stays a literal backslash followed by "n", so the prompt would
            # not contain a newline after the image placeholder.
            content: "<|image_1|>\nProvide a detailed summary of the image."
        # NOTE(review): presumably constructs SceneParsingOcclusion from
        # evaluation.multimodal_data with `floc` as its argument - confirm.
        ${-ds construct evaluation.multimodal_data SceneParsingOcclusion True}:
          floc: ./evaluation/sceneparsing_perturbed_gauss_decolor.pkl
        # Sets SAMPLE_MAX_NEW_TOKS to 512 for this dataset; the top-level
        # max_new_tokens entries read that variable (their fallback is 64).
        __technical: ${!setenv SAMPLE_MAX_NEW_TOKS 512}
        # Token ids on which generation stops, judging by the key name;
        # presumably specific to this model's tokenizer - confirm.
        stop_on_tokens: [32007, 32001]
        dset_split: validation
# General run settings; each value is read from an environment variable.
# Save interval, from SAMPLE_SAVE_EVERY (fallback 256).
# NOTE(review): the unit (samples vs. batches) is not visible here - confirm.
save_every: ${!getenv SAMPLE_SAVE_EVERY 256}
# Dataset identifier, from DATASET_ID; no fallback value is given.
dset_id: ${!getenv DATASET_ID}
# Device string, from USE_DEVICE (fallback cuda:0).
use_device: ${!getenv USE_DEVICE cuda:0}
# Sample count, from SAMPLE_NUM_SAMPLES (fallback 10).
n_samples: ${!getenv SAMPLE_NUM_SAMPLES 10}
# Keyword arguments for sampling-based generation, all overridable through
# SAMPLE_* environment variables.
sampling_kwargs:
  top_p: ${!getenv SAMPLE_TOP_P 0.95}
  top_k: ${!getenv SAMPLE_TOP_K 10}
  # No fallback here: SAMPLE_TEMPERATURE is given its default by the setenv
  # entry in the top-level __technical list.
  temperature: ${!getenv SAMPLE_TEMPERATURE}
  # Fallback is 64; a dataset-specific __technical entry may set
  # SAMPLE_MAX_NEW_TOKS to a different value.
  max_new_tokens: ${!getenv SAMPLE_MAX_NEW_TOKS 64}
# Keyword arguments for beam search ("bs"), judging by the num_beams key and
# the BS_ prefix of its environment variable.
bs_kwargs:
  num_beams: ${!getenv BS_NUM_BEAMS 10}
  # Reads the same SAMPLE_MAX_NEW_TOKS variable as sampling_kwargs, so both
  # generation modes share one length limit.
  max_new_tokens: ${!getenv SAMPLE_MAX_NEW_TOKS 64}
# Dataset range to process, from DSET_RANGE_START / DSET_RANGE_END.
# NOTE(review): -1 presumably means "up to the end of the dataset" - confirm.
dset_range_start: ${!getenv DSET_RANGE_START 0}
dset_range_end: ${!getenv DSET_RANGE_END -1}
# Output directory: SAMPLE_SAVE_DIR (fallback ./sample/04_12_24) followed by
# <DATASET_ID>_<USE_MODEL_SHORT>_<SAMPLE_TEMPERATURE>.
save_dir: ${!getenv SAMPLE_SAVE_DIR ./sample/04_12_24}/${!getenv DATASET_ID}_${!getenv USE_MODEL_SHORT}_${!getenv SAMPLE_TEMPERATURE}
# Logits are not returned by default: transition probabilities are calculated
# anyway, the raw logits are hard to make anything out of, and no current
# algorithm needs them.
return_logits_for_bs: False
# NOTE(review): the variable is spelled PIGGZ_TEMP_DIR (double G) although the
# key says "pigz" - confirm this matches what callers export. No fallback
# value is given.
pigz_temp_storage: ${!getenv PIGGZ_TEMP_DIR }
return_all_hidden: ${!getenv SAMPLE_RETURN_ALL_HIDDEN False}
# NOTE(review): the key is ok_beamer but the value comes from
# SKIP_BEAM_SEARCH - confirm the consumer does not read it with inverted
# meaning.
ok_beamer: ${!getenv SKIP_BEAM_SEARCH False}
