Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Modified parameters for BigtableToParquet #1490

Merged
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
Show all changes
24 commits
Select commit Hold shift + click to select a range
b31bd4b
Modified parameters for BigQueryToParquet
Supriya-Koppa Apr 30, 2024
997dfd2
Modified parameters for BigQueryToParquet
Supriya-Koppa Apr 30, 2024
ae391ca
Modified parameters for BigtableToParquet
Supriya-Koppa Apr 30, 2024
0c932f8
Modified parameters for SpannerVectorEmbeddingExport and TextIOToBigQ…
Supriya-Koppa May 1, 2024
ec32669
Modified parameters for SpannerVectorEmbeddingExport and TextIOToBigQ…
Supriya-Koppa May 1, 2024
bd943b2
Modified parameters for DataStream to BigQuery template
Supriya-Koppa May 1, 2024
19e36d6
Modified parameters for MQTT to Pub/Sub template
Supriya-Koppa May 3, 2024
a7d68c1
Modified parameters for Pub/Sub to Splunk template
Supriya-Koppa May 6, 2024
cde388b
Modified parameters for Pub/Sub to Datadog template
Supriya-Koppa May 6, 2024
1feef9e
Modified parameters for MongoDB to BigQuery template
Supriya-Koppa May 6, 2024
5de7fde
Modified parameters for Datastore to Cloud Storage template
Supriya-Koppa May 6, 2024
a75b30e
Modified parameters for MySQL CDC to BigQuery template
Supriya-Koppa May 6, 2024
1342c6c
Modified parameters for Bigtable to Parquet template (revised)
Supriya-Koppa May 6, 2024
948545e
Modified parameters for BigQuery to Parquet template (revised)
Supriya-Koppa May 6, 2024
704eb35
Merge branch 'main' into koppas-dataflowTemplates
sharan-malyala May 6, 2024
a1d02b5
Apply suggestions from code review
Supriya-Koppa May 7, 2024
acf5569
maven spotless
Supriya-Koppa May 7, 2024
b48de7a
Removing optional from helptext
gauravjain6633 May 8, 2024
ffd8d07
Update v1/src/main/java/com/google/cloud/teleport/templates/common/Da…
Supriya-Koppa May 8, 2024
a0744c0
Apply suggestions from code review
Supriya-Koppa May 8, 2024
6422bf7
Update v1/src/main/java/com/google/cloud/teleport/templates/common/Da…
Supriya-Koppa May 8, 2024
cf990d3
Modified parameters for Cloud Storage to BigQuery - re-done
Supriya-Koppa May 9, 2024
3276300
Modified parameters for Pub/Sub to Splunk - re-done
Supriya-Koppa May 9, 2024
f56eac6
spotless
Supriya-Koppa May 9, 2024
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Jump to
Jump to file
Failed to load files.
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -77,7 +77,7 @@ public interface Options extends PipelineOptions {
order = 1,
description = "Project ID",
helpText =
"The ID of the Google Cloud project of the Cloud Bigtable instance that you want to read data from")
"The ID of the Google Cloud project of the Bigtable instance that you want to read data from.")
ValueProvider<String> getBigtableProjectId();

@SuppressWarnings("unused")
Expand All @@ -87,7 +87,7 @@ public interface Options extends PipelineOptions {
order = 2,
regexes = {"[a-z][a-z0-9\\-]+[a-z0-9]"},
description = "Instance ID",
helpText = "The ID of the Cloud Bigtable instance that contains the table")
helpText = "The ID of the Bigtable instance that contains the table")
Supriya-Koppa marked this conversation as resolved.
Show resolved Hide resolved
ValueProvider<String> getBigtableInstanceId();

@SuppressWarnings("unused")
Expand All @@ -97,7 +97,7 @@ public interface Options extends PipelineOptions {
order = 3,
regexes = {"[_a-zA-Z0-9][-_.a-zA-Z0-9]*"},
description = "Table ID",
helpText = "The ID of the Cloud Bigtable table to export")
helpText = "The ID of the Bigtable table to export.")
ValueProvider<String> getBigtableTableId();

@SuppressWarnings("unused")
Expand All @@ -107,8 +107,7 @@ public interface Options extends PipelineOptions {
order = 4,
description = "Output file directory in Cloud Storage",
helpText =
"The path and filename prefix for writing output files. Must end with a slash. DateTime formatting is used to parse directory path for date & time formatters.",
example = "gs://your-bucket/your-path")
"The Cloud Storage path where data is written. For example, gs://mybucket/somefolder.")
ValueProvider<String> getOutputDirectory();

@SuppressWarnings("unused")
Expand All @@ -117,7 +116,7 @@ public interface Options extends PipelineOptions {
@TemplateParameter.Text(
order = 5,
description = "Parquet file prefix",
helpText = "The prefix of the Parquet file name. For example, \"table1-\"")
helpText = "The prefix of the Parquet filename. For example, output-")
@Default.String("part")
ValueProvider<String> getFilenamePrefix();

Expand All @@ -129,10 +128,7 @@ public interface Options extends PipelineOptions {
optional = true,
description = "Maximum output shards",
helpText =
"The maximum number of output shards produced when writing. A higher number of "
+ "shards means higher throughput for writing to Cloud Storage, but potentially higher "
+ "data aggregation cost across shards when processing output Cloud Storage files. "
+ "Default value is decided by Dataflow.")
"The number of output file shards. For example 2.")
@Default.Integer(0)
ValueProvider<Integer> getNumShards();

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -146,7 +146,7 @@ public interface BigQueryToParquetOptions extends PipelineOptions {
@TemplateParameter.BigQueryTable(
order = 1,
description = "BigQuery table to export",
helpText = "BigQuery table location to export in the format <project>:<dataset>.<table>.",
helpText = "The BigQuery input table location.",
example = "your-project:your-dataset.your-table-name")
@Required
String getTableRef();
Expand All @@ -156,7 +156,7 @@ public interface BigQueryToParquetOptions extends PipelineOptions {
@TemplateParameter.GcsWriteFile(
order = 2,
description = "Output Cloud Storage file(s)",
helpText = "Path and filename prefix for writing output files.",
helpText = "The Cloud Storage folder in which to write the Parquet files",
example = "gs://your-bucket/export/")
@Required
String getBucket();
Expand All @@ -168,10 +168,7 @@ public interface BigQueryToParquetOptions extends PipelineOptions {
optional = true,
description = "Maximum output shards",
helpText =
"The maximum number of output shards produced when writing. A higher number of shards"
+ " means higher throughput for writing to Cloud Storage, but potentially higher"
+ " data aggregation cost across shards when processing output Cloud Storage"
+ " files.")
"(Optional) The number of output file shards. The default value is 1.")
Supriya-Koppa marked this conversation as resolved.
Show resolved Hide resolved
@Default.Integer(0)
Integer getNumShards();

Expand All @@ -181,7 +178,7 @@ public interface BigQueryToParquetOptions extends PipelineOptions {
order = 4,
optional = true,
description = "List of field names",
helpText = "Comma separated list of fields to select from the table.")
helpText = "(Optional) A comma-separated list of fields to select from the input BigQuery table.")
String getFields();

void setFields(String fields);
Expand Down