From 83fb7e36a228a22aeb1ae51898cca301bbd0717c Mon Sep 17 00:00:00 2001 From: Sagar Lakshmipathy <18vidhyasagar@gmail.com> Date: Fri, 17 Nov 2023 17:07:31 -0800 Subject: [PATCH] Docs update quickstart iceberg (#239) * add note for Iceberg sourceFormat * Revert "add note for Iceberg sourceFormat" This reverts commit 245e08e6cffa2459e5f34e341382cfba5974d4ae. * add note for Iceberg sourceFormat * Update how-to.md add `people` to tableBasePath * Update how-to.md fixed typos * clarified context on tableDataPath --- website/docs/how-to.md | 19 +++++++++++++------ 1 file changed, 13 insertions(+), 6 deletions(-) diff --git a/website/docs/how-to.md b/website/docs/how-to.md index 95c3804b..cb486d55 100644 --- a/website/docs/how-to.md +++ b/website/docs/how-to.md @@ -270,9 +270,13 @@ targetFormats: datasets: - tableBasePath: file:///tmp/iceberg-dataset/people - dataBasePath: file:///tmp/iceberg-dataset/people/data + tableDataPath: file:///tmp/iceberg-dataset/people/data tableName: people ``` +:::note Note: +Add `tableDataPath` for ICEBERG sourceFormat if the `tableBasePath` is different from the path to the data. +::: + @@ -296,7 +300,7 @@ targetFormats: - ICEBERG datasets: - - tableBasePath: s3://path/to/hudi-data # replace this with gs://path/to/hudi_data if your data is in GCS. + tableBasePath: s3://path/to/hudi-dataset/people # replace this with gs://path/to/hudi-dataset/people if your data is in GCS. tableName: people partitionSpec: city:VALUE ``` @@ -311,7 +315,7 @@ targetFormats: - ICEBERG datasets: - - tableBasePath: s3://path/to/delta-data # replace this with gs://path/to/delta_data if your data is in GCS. + tableBasePath: s3://path/to/delta-dataset/people # replace this with gs://path/to/delta-dataset/people if your data is in GCS. tableName: people ``` @@ -325,10 +329,13 @@ targetFormats: - DELTA datasets: - - tableBasePath: s3://path/to/iceberg # replace this with gs://path/to/iceberg_data if your data is in GCS. - tableDataPath: s3://path/to/iceberg/data + tableBasePath: s3://path/to/iceberg-dataset/people # replace this with gs://path/to/iceberg-dataset/people if your data is in GCS. + tableDataPath: s3://path/to/iceberg-dataset/people/data tableName: people ``` +:::note Note: +Add `tableDataPath` for ICEBERG sourceFormat if the `tableBasePath` is different from the path to the data. +::: @@ -357,4 +364,4 @@ that can be used to query the source table in different target table formats. ## Next steps Go through the [Catalog Integration guides](/docs/catalogs-index) to register the OneTable synced tables -in different data catalogs. \ No newline at end of file +in different data catalogs.