Spaces:
Sleeping
Sleeping
from pathlib import Path

import pandas as pd
from datasets import load_dataset
from translate import Translator
# Export a fixed slice of the train split of a code-instruction dataset to an
# Excel workbook, one row per example with the columns instruction / input /
# output.

DATASET_NAME = "iamtarun/python_code_instructions_18k_alpaca"
# Half-open row range [ROW_START, ROW_STOP) taken from the train split.
ROW_START, ROW_STOP = 900, 1000
OUTPUT_PATH = Path(
    "/Users/yangweipeng/code/excel/python_code_instructions_18k_alpaca.xlsx"
)

dataset = load_dataset(DATASET_NAME)

# The sliced split is indexed by column name below, i.e. it is used as a
# column-oriented batch (column name -> sequence of values).
train_dataset = dataset["train"][ROW_START:ROW_STOP]
instruction_list = train_dataset["instruction"]
input_list = train_dataset["input"]
output_list = train_dataset["output"]

# NOTE: an optional translation step is currently disabled. When enabled it
# replaces every entry of `instruction_list` in place with
# `Translator(to_lang="zh").translate(entry)` before the frame is built.

init_df = pd.DataFrame(
    {
        "instruction": instruction_list,
        "input": input_list,
        "output": output_list,
    }
)

# `to_excel` does not create missing directories, so make sure the target
# folder exists instead of failing after the dataset has been downloaded.
OUTPUT_PATH.parent.mkdir(parents=True, exist_ok=True)

# index=True keeps the DataFrame's positional index (0..n-1 within the slice)
# as the first column of the sheet.
init_df.to_excel(OUTPUT_PATH, index=True)