{ "cells": [ { "metadata": {}, "cell_type": "markdown", "source": "# Data Stats", "id": "694a6cc631d4ab93" }, { "metadata": { "ExecuteTime": { "end_time": "2024-10-15T18:43:07.644299Z", "start_time": "2024-10-15T18:43:02.316453Z" } }, "cell_type": "code", "source": [ "from datasets import load_dataset\n", "\n", "\n", "# Load the train split of the \"all_pairs\" configuration first, then convert it to pandas.\n", "all_pairs_train = load_dataset(\n", "    \"JetBrains-Research/synthetic-commit-msg-edits\",\n", "    \"all_pairs\",\n", "    split=\"train\",\n", ")\n", "df = all_pairs_train.to_pandas()\n", "df.head()" ], "id": "ed42f4f83199feb2", "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "Downloading data: 100%|██████████| 6.35M/6.35M [00:00<00:00, 9.95MB/s]\n" ] }, { "data": { "text/plain": [ "Generating train split: 0 examples [00:00, ? examples/s]" ], "application/vnd.jupyter.widget-view+json": { "version_major": 2, "version_minor": 0, "model_id": "1a0523289d424b29974b60d017643280" } }, "metadata": {}, "output_type": "display_data" }, { "data": { "text/plain": [ " hash repo \\\n", "0 2febb99eee8ed71c9122db88ca58dd33be0b9550 mesonbuild/meson \n", "1 2febb99eee8ed71c9122db88ca58dd33be0b9550 mesonbuild/meson \n", "2 2febb99eee8ed71c9122db88ca58dd33be0b9550 mesonbuild/meson \n", "3 2febb99eee8ed71c9122db88ca58dd33be0b9550 mesonbuild/meson \n", "4 2febb99eee8ed71c9122db88ca58dd33be0b9550 mesonbuild/meson \n", "\n", " G_text \\\n", "0 Enhance OptionOverrideProxy and simplify optio... \n", "1 Enhance OptionOverrideProxy and simplify optio... \n", "2 Enhance OptionOverrideProxy and simplify optio... \n", "3 Enhance OptionOverrideProxy and simplify optio... \n", "4 Enhance OptionOverrideProxy and simplify optio... \n", "\n", " E_text G_type \\\n", "0 Enhance OptionOverrideProxy for multiple optio... synthetic_backward \n", "1 Refactor OptionOverrideProxy and Backend class... synthetic_backward \n", "2 Refactor OptionOverrideProxy and backend optio... synthetic_backward \n", "3 Refactor: Enhance OptionOverrideProxy for mult... synthetic_backward \n", "4 Refactor OptionOverrideProxy and add target-sp... 
synthetic_backward \n", "\n", " E_type is_related \n", "0 expert_labeled True \n", "1 synthetic_forward True \n", "2 synthetic_forward True \n", "3 synthetic_forward True \n", "4 synthetic_forward_from_backward False " ], "text/html": [ "
\n", " | hash | \n", "repo | \n", "G_text | \n", "E_text | \n", "G_type | \n", "E_type | \n", "is_related | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "2febb99eee8ed71c9122db88ca58dd33be0b9550 | \n", "mesonbuild/meson | \n", "Enhance OptionOverrideProxy and simplify optio... | \n", "Enhance OptionOverrideProxy for multiple optio... | \n", "synthetic_backward | \n", "expert_labeled | \n", "True | \n", "
1 | \n", "2febb99eee8ed71c9122db88ca58dd33be0b9550 | \n", "mesonbuild/meson | \n", "Enhance OptionOverrideProxy and simplify optio... | \n", "Refactor OptionOverrideProxy and Backend class... | \n", "synthetic_backward | \n", "synthetic_forward | \n", "True | \n", "
2 | \n", "2febb99eee8ed71c9122db88ca58dd33be0b9550 | \n", "mesonbuild/meson | \n", "Enhance OptionOverrideProxy and simplify optio... | \n", "Refactor OptionOverrideProxy and backend optio... | \n", "synthetic_backward | \n", "synthetic_forward | \n", "True | \n", "
3 | \n", "2febb99eee8ed71c9122db88ca58dd33be0b9550 | \n", "mesonbuild/meson | \n", "Enhance OptionOverrideProxy and simplify optio... | \n", "Refactor: Enhance OptionOverrideProxy for mult... | \n", "synthetic_backward | \n", "synthetic_forward | \n", "True | \n", "
4 | \n", "2febb99eee8ed71c9122db88ca58dd33be0b9550 | \n", "mesonbuild/meson | \n", "Enhance OptionOverrideProxy and simplify optio... | \n", "Refactor OptionOverrideProxy and add target-sp... | \n", "synthetic_backward | \n", "synthetic_forward_from_backward | \n", "False | \n", "