import os 
from config_base import *

# Directory layout for the STRING data.
# NOTE(review): DATA_DIR is not defined in this file; presumably it is
# supplied by the wildcard import from config_base -- confirm.
STRING_DIR = os.path.join(DATA_DIR, "STRING")

# One sub-directory per STRING release.
v11_DIR, v12_DIR = (
    os.path.join(STRING_DIR, release) for release in ("v11", "v12")
)

# Working sub-directories located under the v12 release directory.
PAIRS_DIR, PROCESSED_DIR = (
    os.path.join(v12_DIR, subdir) for subdir in ("pairs", "processed")
)

# Input files. The first two sit directly in the v12 release directory;
# the cluster file sits in the v12 "processed" sub-directory.
# Note that FASTA_FILE points at the gzip-suffixed (.fa.gz) sequence file.
STRING_FILE = os.path.join(
    v12_DIR, "9606.protein.physical.links.detailed.v12.0.txt"
)
FASTA_FILE = os.path.join(v12_DIR, "9606.protein.sequences.v12.0.fa.gz")
CDHIT_CLUSTER_FILE = os.path.join(PROCESSED_DIR, "clustered_9606.clstr")

# Output TSV files, all placed in the pairs directory.
OUTPUT_POS, OUTPUT_NEG, OUTPUT_COMBINED = (
    os.path.join(PAIRS_DIR, filename)
    for filename in ("pos_pairs.tsv", "neg_pairs.tsv", "combined_pairs.tsv")
)

# Numeric settings; how they are consumed is not visible in this file.
# NOTE(review): presumably the multiplier is the number of negative pairs
# generated per positive pair -- confirm against the consumer.
NEGATIVE_MULTIPLIER: int = 10
# NOTE(review): presumably a minimum score applied to the STRING
# "experimental" evidence channel -- confirm against the consumer.
EXPERIMENT_THRESHOLD: int = 0

# NOTE(review): V11_FILE is not defined in this file; presumably it is
# supplied by the wildcard import from config_base -- confirm.
ppi_file = V11_FILE

# Uncompressed (.fa) sequence files, one per STRING release directory.
v11_fasta = os.path.join(v11_DIR, "9606.protein.sequences.v11.0.fa")
v12_fasta = os.path.join(v12_DIR, "9606.protein.sequences.v12.0.fa")

# Filtered FASTA paths. The v11 and combined files sit in the v11 directory;
# the v12-only file sits in the v12 "processed" directory (PROCESSED_DIR).
filtered_v11 = os.path.join(v11_DIR, "filtered_v11_sequences.fa")
combined_fasta = os.path.join(v11_DIR, "filtered_sequences.fa")
filtered_v12 = os.path.join(PROCESSED_DIR, "filtered_v12_only_sequences.fa")