$schema: https://azuremlschemas.azureedge.net/latest/pipelineJob.schema.json
type: pipeline
display_name: SST2-dp-sweep
experiment_name: auditing-synthetic-text-generation

settings:
  default_compute: azureml:ND40rsv2

inputs:
  model_path:
    type: uri_folder
    path: "azureml:Mistral-7B-v0point1:1"
  train_data_path:
    type: uri_folder
    path: "azureml:SST2-train:3"
  eval_data_path:
    type: uri_folder
    path: "azureml:SST2-test:3"

jobs:
  preprocess:
    type: command
    component: ./components/preprocess_for_synthesizer/component_spec.yml
    inputs:
      train_data_path: ${{parent.inputs.train_data_path}}
      eval_data_path: ${{parent.inputs.eval_data_path}}
      templated_prompt: "A sentence with a {label} sentiment: "
      label_column: "label"
      text_column: "sentence"
    outputs:
      train_data:
        mode: "rw_mount"
      eval_data:
        mode: "rw_mount"
  fine_tune:
    type: sweep
    inputs:
      train_data_path: ${{parent.jobs.preprocess.outputs.train_data}}
      eval_data_path: ${{parent.jobs.preprocess.outputs.eval_data}}
      evaluation_strategy: "steps"
      eval_steps: 10
      label_names: "labels"
      model_path: ${{parent.inputs.model_path}}
      nproc_per_node: 8
      sequence_len: 128
      per_device_train_batch_size: 128
      seed: 239023
      chat_format: False
      target_epsilon: 8
      target_delta: 1e-5
      num_train_epochs: 3.0
      bf16: false
      fp16: false
    outputs:
      output_dir:
        mode: "rw_mount"
    sampling_algorithm: grid
    trial: ../../components/dp_fine_tune_LLM_w_qlora/component_spec.yml
    search_space:
      gradient_accumulation_steps:
        type: "choice"
        values: [1, 2, 4]
      learning_rate:
        type: "choice"
        values: [1e-6, 6e-6, 4e-5, 3e-4, 2e-3, 1e-2]
      per_sample_max_grad_norm:
        type: "choice"
        values: [1e-1, 1, 2]
    objective:
      primary_metric: "eval_loss"
      goal: "minimize"
    limits:
      max_total_trials: 54
  generate:
    type: command
    component: ../../components/llm-synthetic-data-generation/component_spec.yml
    inputs:
      lora_path: ${{parent.jobs.fine_tune.outputs.output_dir}}
      model_path: ${{parent.inputs.model_path}}
      train_data_path: ${{parent.jobs.preprocess.outputs.train_data}}
      nproc_per_node: 8
      batch_size: 32
      seed: 2933
      max_new_tokens: 128
      mixed_precision: "no"
    outputs:
      output_dir:
        mode: "rw_mount"
  compute_utility:
    type: command
    component: ./components/utility_computation/component_spec.yml
    inputs:
      nproc_per_node: 8
      model_name: "roberta-base"
      is_synthetic: True
      train_data_path: ${{parent.jobs.generate.outputs.output_dir}}
      train_label_name: "Prompt"
      train_text_name: "Generation"
      eval_data_path: ${{parent.inputs.eval_data_path}}
      eval_label_name: "label"
      eval_text_name: "sentence"
      sequence_len: 128
      per_device_train_batch_size: 8
      gradient_accumulation_steps: 1
      num_train_epochs: 1
      evaluation_strategy: "steps"
      eval_steps: 100
      save_strategy: "no"
      log_level: info
      seed: 239023
      weight_decay: 0.01
      logging_steps: 10
      learning_rate: 3e-5
    outputs:
      output_dir:
        mode: "rw_mount"