Shaltiel commited on
Commit
531a096
โ€ข
1 Parent(s): cf85943

Added SNLI score

Browse files
Files changed (1) hide show
  1. src/about.py +44 -4
src/about.py CHANGED
@@ -12,10 +12,11 @@ class Task:
12
  # ---------------------------------------------------
13
  class Tasks(Enum):
14
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
15
- task0 = Task("custom|heq-qa-tlnls|0", "heq_tlnls", "QA TLNLS (HeQ)")
16
- task1 = Task("custom|sentiment-acc|0", "sentiment_acc", "Sentiment Acc (Mafat)")
17
- task2 = Task("custom|winograd-acc|0", "winograd_acc", "Winograd (Binary) Acc (V. Schwartz)")
18
- task3 = Task("custom|he-en-trans-bleu|0", "sentence_bleu", "Translation BLEU")
 
19
 
20
  NUM_FEWSHOT = 0 # Change with your few shot
21
  # ---------------------------------------------------
@@ -170,6 +171,45 @@ English: Some sentence to translate to Hebrew <br/>
170
  Hebrew:
171
  </blockquote>
172
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
173
  """
174
 
175
  EVALUATION_QUEUE_TEXT = """
 
12
  # ---------------------------------------------------
13
  class Tasks(Enum):
14
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
15
+ task0 = Task("custom|snli-acc|0", "snli_acc", "SNLI Accuracy")
16
+ task1 = Task("custom|heq-qa-tlnls|0", "heq_tlnls", "QA TLNLS (HeQ)")
17
+ task2 = Task("custom|sentiment-acc|0", "sentiment_acc", "Sentiment Acc (Mafat)")
18
+ task3 = Task("custom|winograd-acc|0", "winograd_acc", "Winograd (Binary) Acc (V. Schwartz)")
19
+ task4 = Task("custom|he-en-trans-bleu|0", "sentence_bleu", "Translation BLEU")
20
 
21
  NUM_FEWSHOT = 0 # Change with your few shot
22
  # ---------------------------------------------------
 
171
  Hebrew:
172
  </blockquote>
173
 
174
+ 5. SNLI Accuracy
175
+
176
+ - **Source**: We took a sample of documents from the test-subset of the official SNLI corpus.
177
+
178
+ - **Scoring**: We compute the accuracy score on the predictions, expecting either "ืกืชื™ืจื”", "ื”ืชืืžื”", or "ื›ืœื•ื".
179
+
180
+ - **Number of examples**: There are a total of 210 examples - 70 from each class - where each example was translated using [Dicta's translation engine](https://translate.dicta.org.il), and then manually reviewed and corrected as needed.
181
+
182
+ - **Few-Shot Format**: For every prompt, we provide 12 few-shot examples, 4 from each category.
183
+
184
+ For example:
185
+
186
+
187
+ <blockquote dir="rtl" style='text-align: right; background-color: #f0f0f0'>
188
+ <p>
189
+ ื”ื ื—ืช ื™ืกื•ื“: ื ืขืจ ืžื ื’ืŸ ื‘ื—ืฆื•ืฆืจืชื• ื‘ืžื”ืœืš ื”ื•ืคืขื” ืขื ืœื”ืงืชื•.<br/>
190
+ ื”ืฉืขืจื”: ืœืืฃ ืื—ื“ ืื™ืŸ ื—ืฆื•ืฆืจื”.<br/>
191
+ ืชืฉื•ื‘ื”: ืกืชื™ืจื”<br/>
192
+
193
+ ...
194
+
195
+ ื”ื ื—ืช ื™ืกื•ื“: ื”ื ืขืจื” ืœื‘ื•ืฉื” ื‘ืžืขื™ืœ ื—ื•ื, ื‘ืขื•ื“ื” ืคื•ืกืขืช ื‘ืฉืœื’.<br/>
196
+ ื”ืฉืขืจื”: ื”ื’ื‘ืจืช ื”ืœื•ื‘ืฉืช ืžืขื™ืœ ืžื—ืคืฉืช ืืช ื›ืœื‘ื” ื”ืื•ื‘ื“.<br/>
197
+ ืชืฉื•ื‘ื”: ื›ืœื•ื<br/>
198
+
199
+ ...
200
+
201
+ ื”ื ื—ืช ื™ืกื•ื“: ืกืคื™ื ืชึพืคืืจ ื‘ื” ืื ืฉื™ื ืขื•ืœื™ื ื•ื™ื•ืจื“ื™ื.<br/>
202
+ ื”ืฉืขืจื”: ืื ืฉื™ื ืขื•ืœื™ื ื•ื™ื•ืจื“ื™ื ืžืกืคื™ื ื•ืช.<br/>
203
+ ืชืฉื•ื‘ื”: ื”ืชืืžื”<br/>
204
+
205
+ ...
206
+
207
+ ื”ื ื—ืช ื™ืกื•ื“: ื”ื ื—ื” ื—ื“ืฉื”<br/>
208
+ ื”ืฉืขืจื”: ื”ืฉืขืจื” ื—ื“ืฉื”<br/>
209
+ ืชืฉื•ื‘ื”:
210
+ </p>
211
+ </blockquote>
212
+
213
  """
214
 
215
  EVALUATION_QUEUE_TEXT = """