"""Export a slice of a Hugging Face instruction dataset to an Excel workbook.

The script loads ``iamtarun/python_code_instructions_18k_alpaca``, takes rows
900-999 of its ``train`` split, and writes the ``instruction``, ``input`` and
``output`` columns to an ``.xlsx`` file.
"""

from datasets import load_dataset
import pandas as pd
from translate import Translator  # only needed by the disabled translation step below

# Dataset identifier passed to ``load_dataset``.
DATASET_NAME = "iamtarun/python_code_instructions_18k_alpaca"

# Half-open row range [ROW_START, ROW_STOP) taken from the ``train`` split.
ROW_START = 900
ROW_STOP = 1000

# Destination workbook. NOTE(review): machine-specific absolute path; the
# parent directory is not created by this script.
OUTPUT_PATH = '/Users/yangweipeng/code/excel/python_code_instructions_18k_alpaca.xlsx'

dataset = load_dataset(DATASET_NAME)

# Slicing the split selects the requested rows; each column is then read from
# the result by name.
train_dataset = dataset['train'][ROW_START:ROW_STOP]

instruction_list = train_dataset['instruction']
input_list = train_dataset['input']
output_list = train_dataset['output']

# Optional step, currently disabled: translate every instruction to Chinese
# ("zh") in place before exporting.
# translator = Translator(to_lang="zh")
# for idx in range(len(instruction_list)):
#     instruction_list[idx] = translator.translate(instruction_list[idx])

init_df = pd.DataFrame(
    {
        'instruction': instruction_list,
        'input': input_list,
        'output': output_list,
    }
)

# index=True also writes the DataFrame's row index as a column of the sheet.
init_df.to_excel(OUTPUT_PATH, index=True)