{"eval_loss": 1.1608266830444336, "eval_accuracy": 0.61, "eval_pred_num_tokens": 17.25, "eval_true_num_tokens": 19.75, "eval_token_set_precision": 0.6072330447330447, "eval_token_set_recall": 0.6363636363636364, "eval_token_set_f1": 0.620899631769197, "eval_token_set_f1_sem": 0.10481871831396225, "eval_n_ngrams_match_1": 8.75, "eval_n_ngrams_match_2": 5.0, "eval_n_ngrams_match_3": 3.5, "eval_num_true_words": 16.0, "eval_num_pred_words": 13.75, "eval_bleu_score": 31.934171484731365, "eval_bleu_score_sem": 14.842521437478405, "eval_rouge_score": 0.6470382882882882, "eval_exact_match": 0.0, "eval_exact_match_sem": 0.0, "eval_ada_emb_cos_sim_mean": 0.9159811735153198, "eval_ada_emb_cos_sim_sem": 0.023651350289583206, "eval_emb_cos_sim": 0.9949486255645752, "eval_emb_cos_sim_sem": 0.001761533203534782, "eval_emb_top1_equal": 0.25, "eval_emb_top1_equal_sem": 0.25, "eval_perplexity": 3.1925714301767956, "eval_runtime": 94.1794, "eval_samples_per_second": 0.042, "eval_steps_per_second": 0.011, "_eval_args": {"alias": "jxm/t5-base__llama-7b-chat__one-million-instructions", "dataset": "python_code_alpaca", "num_samples": 4, "embedder_model_name": "meta-llama/Llama-2-7b-chat-hf"}}