{"eval_pred_num_tokens": 43.125, "eval_true_num_tokens": 17.8515625, "eval_token_set_precision": 0.48400679044932376, "eval_token_set_recall": 0.34343714585567153, "eval_token_set_f1": 0.3803040307433806, "eval_token_set_f1_sem": 0.02296623107834086, "eval_n_ngrams_match_1": 7.5, "eval_n_ngrams_match_2": 5.535, "eval_n_ngrams_match_3": 4.84, "eval_num_true_words": 14.825, "eval_num_pred_words": 36.6, "eval_bleu_score": 21.29580272831924, "eval_bleu_score_sem": 2.0316839202058663, "eval_exact_match": 0.005, "eval_exact_match_sem": 0.005000000000000001, "eval_ada_emb_cos_sim_mean": 0.7857118248939514, "eval_ada_emb_cos_sim_sem": 0.007256609934760893, "eval_emb_cos_sim": 0.9983388185501099, "eval_emb_cos_sim_sem": 0.0012364102294668555, "eval_emb_top1_equal": 0.75, "eval_emb_top1_equal_sem": 0.25, "eval_runtime": 321.1581, "eval_samples_per_second": 0.623, "eval_steps_per_second": 0.156, "_eval_args": {"alias": "jailbreak", "prompt": "11_return", "max_seq_length": 64, "num_samples": 200, "embedder_model_name": "meta-llama/Llama-2-13b-hf", "dataset": "anthropic_toxic_prompts", "gpt_version": "gpt-3.5-turbo-0613", "take_first_line": true}}