# Code/preprocess
# parquet2csv
# Shy_un
# 2023. 8. 16. 11:46
import pandas as pd
import argparse
# Command-line interface: both options are mandatory.
#   --dir : path of the parquet file to read, e.g. C/.../file.parquet
#   --out : path of the CSV file to write,   e.g. C/.../out.csv
parser = argparse.ArgumentParser()
for flag, description in (
    ('--dir', 'dir address'),
    ('--out', 'out address'),
):
    parser.add_argument(flag, required=True, help=description)
args = parser.parse_args()

# Load the parquet file through the pyarrow engine, then dump it as CSV.
# index=False keeps the DataFrame index out of the output file.
df = pd.read_parquet(path=args.dir, engine='pyarrow')
df.to_csv(path_or_buf=args.out, index=False)