#!/bin/bash
# Convert a gzip-compressed, tab-separated table into a sorted,
# bgzip-compressed, tabix-indexed BED-style file.
#
# Usage: <script> INPUT.tsv.gz OUTPUT.bed.gz
#   $1 (FILE) - gzip-compressed, tab-delimited input table
#   $2 (OUT)  - output path; `tabix -p bed` then builds an index for it
#
# NOTE(review): the column numbers used below look like the ICGC
# simple-somatic-mutation layout - confirm against the real input header.

# Abort on errors, on unset variables, and when ANY pipeline stage fails, so a
# corrupt or truncated input is never silently compressed and indexed.
set -euo pipefail

if [[ $# -lt 2 ]]; then
  printf 'Usage: %s INPUT.tsv.gz OUTPUT.bed.gz\n' "${0##*/}" >&2
  exit 2
fi

FILE=$1
OUT=$2

# Pipeline stages:
#   1. cut   - keep input columns 2, 9-11, 14, 15, 17 and 34; they become
#              $1..$8 in the awk program.
#   2. uniq  - drop duplicate rows; only ADJACENT duplicates are collapsed
#              because this runs before the sort.
#   3. awk   - keep rows whose $5 is not "single base substitution" and whose
#              $8 is "WGS"; emit $2, $3-1, $4, $6, $7, $1. The "-1" shifts the
#              start coordinate down by one, matching the BED preset used by
#              tabix below.
#   4. sort  - version-sort on the first two output columns, as tabix needs
#              position-sorted input.
#
# To keep ONLY single base substitutions instead, change `!=` to `==`.
# Debugging aids: insert `| head -n N` before bgzip to sample the output, or
# filter on the last output column, e.g. awk -F $'\t' '$6 == "DO220846"'.
gunzip -c -- "$FILE" \
  | cut -d $'\t' -f 2,9-11,14,15,17,34 \
  | uniq \
  | awk -F $'\t' 'BEGIN { OFS = FS }
      $5 != "single base substitution" && $8 == "WGS" {
        print $2, $3 - 1, $4, $6, $7, $1
      }' \
  | sort -V -k1,1 -k2,2 \
  | bgzip -c > "$OUT"

# Only reached when every stage above succeeded (set -e + pipefail).
tabix -p bed "$OUT"
