Skip to content

Commit

Permalink
Add manifest for smaller CH-BenCHmark dataset for debugging
Browse files Browse the repository at this point in the history
  • Loading branch information
geoffxy committed Apr 15, 2024
1 parent 940749a commit 835c5b2
Showing 1 changed file with 88 additions and 0 deletions.
88 changes: 88 additions & 0 deletions config/manifests/manifest_chbenchmark_small.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,88 @@
# Manifest for the small CH-BenCHmark dataset (chbenchmark_small).
# S3 bucket and bucket region for the dataset files. The per-table s3_path
# values below are presumably resolved inside this bucket -- confirm against
# the code that consumes this manifest.
s3_bucket: geoffxy-research
s3_bucket_region: us-east-1
# Schema name for this dataset; it is also the leading path component of every
# s3_path listed below.
schema_name: chbenchmark_small

# One entry per table: the table name, its S3 object path, and one option
# string per aurora_/redshift_/athena_ key.
tables:
- table_name: warehouse
  s3_path: chbenchmark_small/warehouse/warehouse.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: item
  s3_path: chbenchmark_small/item/item.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: stock
  s3_path: chbenchmark_small/stock/stock.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. HEADER carries an explicit `true` so this entry reads the
  # same as the other tables in this manifest (a bare HEADER already means true
  # in PostgreSQL COPY option syntax -- assuming that is what consumes this
  # string). Folded block scalars (>-) keep the embedded SQL quotes and the
  # backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: district
  s3_path: chbenchmark_small/district/district.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: customer
  s3_path: chbenchmark_small/customer/customer.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: history
  s3_path: chbenchmark_small/history/history.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: orders
  s3_path: chbenchmark_small/orders/orders.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: new_order
  s3_path: chbenchmark_small/new_order/new_order.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: order_line
  s3_path: chbenchmark_small/order_line/order_line.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: supplier
  s3_path: chbenchmark_small/supplier/supplier.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: nation
  s3_path: chbenchmark_small/nation/nation.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

- table_name: region
  s3_path: chbenchmark_small/region/region.tbl
  # Option strings, one per engine key; all describe a '|'-delimited file with
  # one header row. Folded block scalars (>-) keep the embedded SQL quotes and
  # the backslash literal, so no YAML escaping is needed.
  aurora_options: >-
    FORMAT CSV, HEADER true, ESCAPE ''\'', DELIMITER ''|''
  redshift_options: >-
    CSV IGNOREHEADER 1 DELIMITER '|' BLANKSASNULL
  athena_options1: >-
    ROW FORMAT DELIMITED FIELDS TERMINATED BY '|' NULL DEFINED AS '' STORED AS TEXTFILE
  athena_options2: >-
    TBLPROPERTIES ('skip.header.line.count' = '1')

0 comments on commit 835c5b2

Please sign in to comment.