{"metadata":{"accelerator":"GPU","colab":{"gpuType":"T4","provenance":[]},"gpuClass":"standard","kernelspec":{"name":"python3","display_name":"Python 3","language":"python"},"language_info":{"name":"python","version":"3.10.13","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"},"kaggle":{"accelerator":"nvidiaTeslaT4","dataSources":[{"sourceId":7571253,"sourceType":"datasetVersion","datasetId":4407676},{"sourceId":7678915,"sourceType":"datasetVersion","datasetId":4479814},{"sourceId":7713636,"sourceType":"datasetVersion","datasetId":4504654},{"sourceId":7964016,"sourceType":"datasetVersion","datasetId":4685329},{"sourceId":8017122,"sourceType":"datasetVersion","datasetId":4723613}],"dockerImageVersionId":30684,"isInternetEnabled":true,"language":"python","sourceType":"notebook","isGpuEnabled":true}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"markdown","source":"
The objective of this notebook is to evaluate the performance of Gemini-1.5-Pro, Gemini-Pro, OpenHermes, and Mistral-7B on the Table-extract Benchmark dataset, which is available on Hugging Face.
\n\n | context | \nanswer | \n
---|---|---|
0 | \naircraft ... | \n{\"aircraft\":{\"0\":\"robinson r - 22\",\"1\":\"bell 2... | \n
1 | \norder year manufacturer mod... | \n{\"order year\":{\"0\":\"1992 - 93\",\"1\":\"1996\",\"2\":... | \n
2 | \nplayer no nationality ... | \n{\"player\":{\"0\":\"quincy acy\",\"1\":\"hassan adams\"... | \n
3 | \nplayer no nationali... | \n{\"player\":{\"0\":\"patrick o'bryant\",\"1\":\"jermain... | \n
4 | \nplayer no nationality ... | \n{\"player\":{\"0\":\"mark baker\",\"1\":\"marcus banks\"... | \n
\n | context | \nanswer | \n
---|---|---|
0 | \naircraft ... | \n[{'aircraft': 'robinson r - 22', 'description'... | \n
1 | \norder year manufacturer mod... | \n[{'order year': '1992 - 93', 'manufacturer': '... | \n
2 | \nplayer no nationality ... | \n[{'player': 'quincy acy', 'no': '4', 'national... | \n
3 | \nplayer no nationali... | \n[{'player': 'patrick o'bryant', 'no': 13, 'nat... | \n
4 | \nplayer no nationality ... | \n[{'player': 'mark baker', 'no': '3', 'national... | \n