set -euo pipefail
. recognizers/functions.bash

usage() {
  echo "Usage: $0 <language-dir> <model-dir> [--plot-attention] [--num-examples N]

Analyze a transformer model's residual stream on a language.
    
  --plot-attention
    Also generate attention pattern plots.
    
  --num-examples N
    Number of examples to analyze (default: 5).
"
}

analysis_args=()
language_dir=""
model_dir=""

# Process positional arguments first
if [ $# -ge 2 ]; then
  language_dir="$1"
  model_dir="$2"
  shift 2
else
  usage >&2
  exit 1
fi

# Process any remaining arguments
while [[ $# -gt 0 ]]; do
  case "$1" in
    --plot-attention)
      analysis_args+=("--plot-attention")
      shift
      ;;
    --num-examples)
      if [ $# -ge 2 ]; then
        analysis_args+=("--num-examples" "$2")
        shift 2
      else
        echo "Error: Missing value for --num-examples" >&2
        usage >&2
        exit 1
      fi
      ;;
    *)
      echo "Unknown option: $1" >&2
      usage >&2
      exit 1
      ;;
  esac
done

datasets=(test training)
# Optional datasets.
for dataset in test-short-held-out test-edit-distance; do
  if [[ -e $language_dir/datasets/$dataset ]]; then
    datasets+=("$dataset")
  fi
done

analysis_dir=$model_dir/analysis
mkdir -p "$analysis_dir"

# Check if this is a transformer model by looking at architecture in metadata
is_transformer=false
metadata_file="$model_dir/model_metadata.json"
if [ -f "$metadata_file" ]; then
  if grep -q '"architecture"[[:space:]]*:[[:space:]]*"transformer"' "$metadata_file"; then
    is_transformer=true
  fi
else
  # If metadata file doesn't exist, create a simple one based on the model structure
  echo "Model metadata file not found. Creating one based on model structure..."
  
  # Check if the model has transformer architecture patterns
  if [ -d "$model_dir/checkpoints" ]; then
    if grep -q "attention" "$model_dir/checkpoints/metadata.json" 2>/dev/null; then
      is_transformer=true
      cat > "$model_dir/model_metadata.json" << EOF
{
  "architecture": "transformer",
  "created_automatically": true
}
EOF
      echo "Created model metadata file indicating transformer architecture."
    fi
  fi
fi

# Run the analysis script if it's a transformer model
if [ "$is_transformer" = true ]; then
  echo "Running transformer analysis..."
  
  python recognizers/neural_networks/analyze_transformer.py \
    --load-model "$model_dir" \
    --data-dir "$language_dir" \
    --datasets "${datasets[@]}" \
    --output "$analysis_dir" \
    "${analysis_args[@]}"
  
  echo "Transformer analysis complete. Results saved to $analysis_dir"
else
  echo "Not a transformer model, skipping transformer analysis."
  exit 1
fi
