File size: 502 Bytes
2beb46b
04c6827
 
 
 
 
2beb46b
 
 
f59ef60
2beb46b
04c6827
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
import os
#import pandas as pd
#import pyarrow
#import fastparquet
from datasets import load_dataset_builder
from datasets import load_dataset
# Hugging Face access token taken from the HFTOKEN environment variable
# (None when the variable is not set).
access_token = os.getenv("HFTOKEN")

# Mapping of split name -> file(s) handed to load_dataset for that split.
data_files = {
    "train": ["train.zip", "train.csv"],
    "test": "test.zip",
}

# Load the 'competitions/aiornot' dataset with the token and file mapping above.
dataset = load_dataset(
    "competitions/aiornot",
    data_files=data_files,
    token=access_token,
)
def read_par(file="data.parquet"):
    """Read a Parquet file into a pandas DataFrame.

    Args:
        file: Location of the Parquet data; passed unchanged to
            ``pandas.read_parquet``. Defaults to ``"data.parquet"``, the
            path this function used to have hard-coded.

    Returns:
        The DataFrame returned by ``pandas.read_parquet`` using the
        ``pyarrow`` engine.
    """
    # Imported here so the function works even though this module does not
    # import pandas at top level.
    import pandas as pd

    return pd.read_parquet(file, engine='pyarrow')