{"metadata":{"accelerator":"GPU","colab":{"gpuType":"T4","provenance":[]},"gpuClass":"standard","kernelspec":{"name":"python3","display_name":"Python 3","language":"python"},"language_info":{"name":"python","version":"3.10.13","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"},"kaggle":{"accelerator":"nvidiaTeslaT4","dataSources":[{"sourceId":7571253,"sourceType":"datasetVersion","datasetId":4407676},{"sourceId":7678915,"sourceType":"datasetVersion","datasetId":4479814},{"sourceId":7713636,"sourceType":"datasetVersion","datasetId":4504654},{"sourceId":8017122,"sourceType":"datasetVersion","datasetId":4723613},{"sourceId":4298,"sourceType":"modelInstanceVersion","modelInstanceId":3093},{"sourceId":5110,"sourceType":"modelInstanceVersion","modelInstanceId":3898}],"dockerImageVersionId":30674,"isInternetEnabled":true,"language":"python","sourceType":"notebook","isGpuEnabled":true}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"markdown","source":"
The objective of this notebook is to evaluate the performance of OpenChat-3.5-1210 and dolphin-2.2.1-mistral-7b on the Table-extract Benchmark dataset available on Hugging Face.
\n\n | context | answer | \n
---|---|---|
0 | aircraft ... | {\"aircraft\":{\"0\":\"robinson r - 22\",\"1\":\"bell 2... | \n
1 | order year manufacturer mod... | {\"order year\":{\"0\":\"1992 - 93\",\"1\":\"1996\",\"2\":... | \n
2 | player no nationality ... | {\"player\":{\"0\":\"quincy acy\",\"1\":\"hassan adams\"... | \n
3 | player no nationali... | {\"player\":{\"0\":\"patrick o'bryant\",\"1\":\"jermain... | \n
4 | player no nationality ... | {\"player\":{\"0\":\"mark baker\",\"1\":\"marcus banks\"... | \n