Skip to content

Commit

Permalink
Fix TPCH data conversion
Browse files Browse the repository at this point in the history
  • Loading branch information
Jefffrey committed Sep 23, 2024
1 parent b8ec195 commit 5f6b8da
Showing 1 changed file with 4 additions and 2 deletions.
6 changes: 4 additions & 2 deletions scripts/convert_tpch.py
Original file line number Diff line number Diff line change
@@ -113,9 +113,11 @@
 }

 for table in tables:
+    schema = schemas[table]
     tbl = csv.read_csv(
         f"benchmark_data/{table}.tbl",
+        read_options=csv.ReadOptions(column_names=schema.names),
         parse_options=csv.ParseOptions(delimiter="|"),
-        convert_options=csv.ConvertOptions(column_types=schemas[table]),
+        convert_options=csv.ConvertOptions(column_types=schema),
     )
-    orc.write_table(tbl, f"benchmark_data/{table}.orc", compression="zstd")
+    orc.write_table(tbl, f"benchmark_data/{table}.orc")

0 comments on commit 5f6b8da

Please sign in to comment.