From f8da06bcc8d45a23b4e994d44e2ce7cf0fcb6df0 Mon Sep 17 00:00:00 2001 From: Yi Hu Date: Tue, 9 Jun 2026 14:05:36 -0400 Subject: [PATCH] Fix yaml doc generation --- sdks/python/apache_beam/yaml/standard_io.yaml | 1 - sdks/python/build.gradle | 28 +++++++++++++++---- 2 files changed, 22 insertions(+), 7 deletions(-) diff --git a/sdks/python/apache_beam/yaml/standard_io.yaml b/sdks/python/apache_beam/yaml/standard_io.yaml index 781d3de193ec..4f679c4a77c4 100644 --- a/sdks/python/apache_beam/yaml/standard_io.yaml +++ b/sdks/python/apache_beam/yaml/standard_io.yaml @@ -418,7 +418,6 @@ catalog_properties: 'catalog_properties' config_properties: 'config_properties' triggering_frequency_seconds: 'triggering_frequency_seconds' - append_batch_size: 'append_batch_size' location_prefix: 'location_prefix' partition_fields: 'partition_fields' table_properties: 'table_properties' diff --git a/sdks/python/build.gradle b/sdks/python/build.gradle index 5f09dff57e8f..b39b12f198e9 100644 --- a/sdks/python/build.gradle +++ b/sdks/python/build.gradle @@ -101,16 +101,32 @@ tasks.register("generateManagedIOPage") { } } +tasks.register("prepareExpansionServicesForYamlDocs") { + description "Builds all expansion services referenced in apache_beam/yaml/*.*" + + dependsOn ":sdks:java:extensions:schemaio-expansion-service:shadowJar" + dependsOn ":sdks:java:extensions:sql:expansion-service:shadowJar" + dependsOn ":sdks:java:io:expansion-service:shadowJar" + dependsOn ":sdks:java:io:google-cloud-platform:expansion-service:shadowJar" + + doLast { + // Copy expansion service jar into cache path (.apache_beam/cache/jars/).
+ copy { + from project.tasks.findByPath(":sdks:java:extensions:schemaio-expansion-service:shadowJar") + from project.tasks.findByPath(":sdks:java:extensions:sql:expansion-service:shadowJar") + from project.tasks.findByPath(":sdks:java:io:expansion-service:shadowJar") + from project.tasks.findByPath(":sdks:java:io:google-cloud-platform:expansion-service:shadowJar") + into "${System.getProperty('user.home')}/.apache_beam/cache/jars/" + } + } +} + tasks.register("generateYamlDocs") { description "Generates the reference documentation for all YAML transforms." dependsOn buildPython - // Need to build all expansion services referenced in apache_beam/yaml/*.* - // grep -oh 'sdk.*Jar' sdks/python/apache_beam/yaml/*.yaml | sort | uniq - dependsOn ":sdks:java:extensions:schemaio-expansion-service:shadowJar" - dependsOn ":sdks:java:extensions:sql:expansion-service:shadowJar" - dependsOn ":sdks:java:io:expansion-service:build" - dependsOn ":sdks:java:io:google-cloud-platform:expansion-service:build" + dependsOn prepareExpansionServicesForYamlDocs + def extraPackages = "pyyaml markdown docstring_parser pandas pygments Jinja2 virtualenv-clone" doLast {