dockerspace / data.py
glennrory's picture
Update data.py
2f85126 verified
raw
history blame contribute delete
161 Bytes
from datasets import load_dataset
def get_data():
    """Open the ``codeparrot/github-code`` train split in streaming mode.

    The first record of the stream is printed as a quick sanity check, and
    the dataset object is then handed back to the caller so it can actually
    be iterated (previously it was dropped and the function returned
    ``None``).

    Returns:
        The object produced by ``load_dataset(..., streaming=True,
        split="train")``. It is iterable; each ``iter()`` call on it is
        expected to start a fresh pass over the stream, so the preview
        print should not consume the first record for the caller
        (NOTE(review): confirm against the installed ``datasets`` version).

    Raises:
        StopIteration: if the stream yields no records at all.
    """
    # streaming=True avoids downloading the whole corpus up front; records
    # are fetched lazily as the dataset is iterated.
    ds = load_dataset("codeparrot/github-code", streaming=True, split="train")

    # Preview one record so a misconfigured dataset fails loudly here.
    print(next(iter(ds)))

    return ds