nicholasKluge committed on
Commit
37677ea
·
1 Parent(s): 28b1924

Upload truthful_qa_eval.ipynb

Browse files
Files changed (1) hide show
  1. truthful_qa_eval.ipynb +3 -3
truthful_qa_eval.ipynb CHANGED
@@ -753,7 +753,7 @@
753
  },
754
  {
755
  "cell_type": "code",
756
- "execution_count": 6,
757
  "metadata": {
758
  "id": "V0qUtme9m6gp",
759
  "outputId": "e8596f0c-6c9f-4ef8-c49a-58fefb458a6a"
@@ -763,14 +763,14 @@
763
  "name": "stdout",
764
  "output_type": "stream",
765
  "text": [
766
- "{'bleu': 0.07843873724059973, 'precisions': [0.16914540670403844, 0.08830763693082969, 0.0596619576185671, 0.042478229076646945], 'brevity_penalty': 1.0, 'length_ratio': 2.219936507936508, 'translation_length': 17482, 'reference_length': 7875}\n"
767
  ]
768
  }
769
  ],
770
  "source": [
771
  "import evaluate\n",
772
  "\n",
773
- "rouge = evaluate.load('bleu') # bleu\n",
774
  "\n",
775
  "references = dataset.best_answer.to_list()\n",
776
  "predictions = dataset.models_responses.to_list()\n",
 
753
  },
754
  {
755
  "cell_type": "code",
756
+ "execution_count": 7,
757
  "metadata": {
758
  "id": "V0qUtme9m6gp",
759
  "outputId": "e8596f0c-6c9f-4ef8-c49a-58fefb458a6a"
 
763
  "name": "stdout",
764
  "output_type": "stream",
765
  "text": [
766
+ "{'rouge1': 0.24958893911586305, 'rouge2': 0.13816924470734443, 'rougeL': 0.22814075909017828, 'rougeLsum': 0.22836556528082447}\n"
767
  ]
768
  }
769
  ],
770
  "source": [
771
  "import evaluate\n",
772
  "\n",
773
+ "rouge = evaluate.load('rouge') # bleu\n",
774
  "\n",
775
  "references = dataset.best_answer.to_list()\n",
776
  "predictions = dataset.models_responses.to_list()\n",