import os,glob, subprocess, re, argparse
# Redirect the Hugging Face cache root to the relative directory "checkpoints"
# (resolved against the current working directory).
# NOTE(review): this assignment sits before the huggingface_hub / datasets /
# transformers imports, presumably because those libraries read HF_HOME when
# they are imported -- confirm before moving it below the imports.
os.environ['HF_HOME'] = "checkpoints"
from huggingface_hub import login
#
from datasets import load_dataset
from datasets import concatenate_datasets
from transformers import AutoModelForSeq2SeqLM
from transformers import AutoModelForCausalLM, AutoTokenizer, TrainingArguments, AutoModelForSeq2SeqLM
from transformers import T5Tokenizer, T5ForConditionalGeneration

# model = AutoModelForSeq2SeqLM.from_pretrained("google/flan-t5-small")
# for qwen_size in ['base']:
#     model_name = f"google/flan-t5-{qwen_size}"
#     tokenizer = AutoTokenizer.from_pretrained(model_name)
#     model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
#     print(tokenizer.pad_token)

# Scratch check of the DeepSeek chat tokenizer: load the tokenizer and model
# for one checkpoint, then print how a handful of prompts are encoded.
model_name = "deepseek-ai/deepseek-llm-7b-chat"
tokenizer = AutoTokenizer.from_pretrained(model_name)
# The model is loaded here but not otherwise used in the lines below.
model = AutoModelForCausalLM.from_pretrained(model_name)

# Prompts to encode, in the order they are printed. Several of them contain
# "Assistant:" in different surrounding contexts (presumably to compare how
# that marker is tokenized -- verify intent with the author).
probe_texts = (
    'bgfn Assistant:',
    'Hello! Can you say yes? ',
    'Hello! Can you say yes?\nAssistant: Yes.',
    'Hello! Can you say yes.\nAssistant: Hell yeah.',
)
for probe_text in probe_texts:
    encoded = tokenizer.encode(probe_text)
    print(encoded)

# Finally, show which padding token (if any) the tokenizer reports.
print(tokenizer.pad_token)
# for i in ['sst2','cola','rte','qnli','mrpc','wnli','qqp','mnli']:
#     dataset_test = load_dataset("nyu-mll/glue", i)
# for i in ['small','base','large','xl']:
#     ckpt = f'google/t5-v1_1-{i}'
#     model = AutoModelForSeq2SeqLM.from_pretrained(ckpt)
    # ds_train = load_dataset("google/code_x_glue_cc_clone_detection_big_clone_bench", split='train')
    # ds_val = load_dataset("google/code_x_glue_cc_clone_detection_big_clone_bench", split='validation')

# d_l = ['python', 'java']
# ds_trains = [load_dataset("google/code_x_glue_ct_code_to_text", i, split='train') for i in d_l]
# ds_vals = [load_dataset("google/code_x_glue_ct_code_to_text", i, split='validation') for i in d_l]
# ds_train, ds_val = concatenate_datasets(ds_trains), concatenate_datasets(ds_vals)

# ds_train = load_dataset("google/code_x_glue_tc_text_to_code", split='train')
# ds_val = load_dataset("google/code_x_glue_tc_text_to_code", split='validation')

# ds_train = load_dataset("google/code_x_glue_cc_defect_detection", split='train')
# ds_val = load_dataset("google/code_x_glue_cc_defect_detection", split='validation')
    