Skip to content

Commit

Permalink
feat: generate full connector catalog json (#18562)
Browse files Browse the repository at this point in the history
* move combo catalog generator from cloud to oss, trigger on processResources

* generate catalog

* regenerate catalog

* add test

* add explicit gradle task for generating combo catalog

* run format

* ignore generated file from the formatter

* update generated catalog

* ignore oss catalog

* fix ignore path
  • Loading branch information
pedroslopez authored Nov 3, 2022
1 parent 74792c1 commit bf43f62
Show file tree
Hide file tree
Showing 5 changed files with 250 additions and 0 deletions.
3 changes: 3 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -71,6 +71,9 @@ docs/SUMMARY.md
# Files generated by unit tests
**/specs_secrets_mask.yaml

# Files generated for uploading to GCS
airbyte-config/**/resources/seed/oss_catalog.json

# Helm charts .tgz dependencies
charts/**/charts

Expand Down
15 changes: 15 additions & 0 deletions airbyte-config/specs/build.gradle
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@ dependencies {

implementation project(':airbyte-commons')
implementation project(':airbyte-commons-cli')
implementation project(':airbyte-commons-docker')
implementation project(':airbyte-config:config-models')
implementation project(':airbyte-protocol:protocol-models')
implementation project(':airbyte-json-validation')
Expand All @@ -32,4 +33,18 @@ task generateConnectorSpecsMask(type: JavaExec, dependsOn: generateSeedConnector

project(":airbyte-config:init").tasks.processResources.dependsOn(generateConnectorSpecsMask)

task generateCombinedConnectorCatalog(type: JavaExec, dependsOn: generateSeedConnectorSpecs) {
classpath = sourceSets.main.runtimeClasspath

mainClass = 'io.airbyte.config.specs.CombinedConnectorCatalogGenerator'

args '--seed-root'
args new File(project(":airbyte-config:init").projectDir, '/src/main/resources/seed')

args '--output-filename'
args 'oss_catalog.json'
}

project(":airbyte-config:init").tasks.processResources.dependsOn(generateCombinedConnectorCatalog)

Task publishArtifactsTask = getPublishArtifactsTask("$rootProject.ext.version", project)
Original file line number Diff line number Diff line change
@@ -0,0 +1,109 @@
/*
* Copyright (c) 2022 Airbyte, Inc., all rights reserved.
*/

package io.airbyte.config.specs;

import com.fasterxml.jackson.databind.JsonNode;
import com.fasterxml.jackson.databind.node.BooleanNode;
import com.fasterxml.jackson.databind.node.ObjectNode;
import com.google.common.annotations.VisibleForTesting;
import io.airbyte.commons.cli.Clis;
import io.airbyte.commons.docker.DockerUtils;
import io.airbyte.commons.io.IOs;
import io.airbyte.commons.json.Jsons;
import io.airbyte.commons.util.MoreIterators;
import io.airbyte.commons.yaml.Yamls;
import io.airbyte.config.AirbyteConfigValidator;
import io.airbyte.config.CombinedConnectorCatalog;
import io.airbyte.config.ConfigSchema;
import io.airbyte.config.DockerImageSpec;
import io.airbyte.config.StandardDestinationDefinition;
import io.airbyte.config.StandardSourceDefinition;
import java.nio.file.Path;
import java.util.List;
import java.util.Map;
import java.util.stream.Collectors;
import org.apache.commons.cli.CommandLine;
import org.apache.commons.cli.Option;
import org.apache.commons.cli.Options;

/**
* Generates a combined representation of the connector catalog that includes Sources, Destinations
* and their specs all in one. This connector catalog can then be served and loaded from a
* RemoteDefinitionsProvider.
*/
public class CombinedConnectorCatalogGenerator {

private static final Option SEED_ROOT_OPTION = Option.builder("s").longOpt("seed-root").hasArg(true).required(true)
.desc("path to where seed resource files are stored").build();
private static final Option OUTPUT_FILENAME_OPTION = Option.builder("o").longOpt("output-filename").hasArg(true).required(true)
.desc("name for the generated catalog json file").build();
private static final Options OPTIONS = new Options().addOption(SEED_ROOT_OPTION).addOption(OUTPUT_FILENAME_OPTION);

public static void main(final String[] args) throws Exception {
final CommandLine parsed = Clis.parse(args, OPTIONS);
final Path outputRoot = Path.of(parsed.getOptionValue(SEED_ROOT_OPTION.getOpt()));
final String outputFileName = parsed.getOptionValue(OUTPUT_FILENAME_OPTION.getOpt());

final CombinedConnectorCatalogGenerator combinedConnectorCatalogGenerator = new CombinedConnectorCatalogGenerator();
combinedConnectorCatalogGenerator.run(outputRoot, outputFileName);
}

public void run(final Path outputRoot, final String outputFileName) {
final List<JsonNode> destinationDefinitionsJson = getSeedJson(outputRoot, SeedConnectorType.DESTINATION.getDefinitionFileName());
final List<JsonNode> destinationSpecsJson = getSeedJson(outputRoot, SeedConnectorType.DESTINATION.getSpecFileName());
final List<JsonNode> sourceDefinitionsJson = getSeedJson(outputRoot, SeedConnectorType.SOURCE.getDefinitionFileName());
final List<JsonNode> sourceSpecsJson = getSeedJson(outputRoot, SeedConnectorType.SOURCE.getSpecFileName());

mergeSpecsIntoDefinitions(destinationDefinitionsJson, destinationSpecsJson, ConfigSchema.STANDARD_DESTINATION_DEFINITION);
mergeSpecsIntoDefinitions(sourceDefinitionsJson, sourceSpecsJson, ConfigSchema.STANDARD_SOURCE_DEFINITION);

final CombinedConnectorCatalog combinedCatalog = new CombinedConnectorCatalog()
.withDestinations(destinationDefinitionsJson.stream().map(j -> Jsons.object(j, StandardDestinationDefinition.class)).toList())
.withSources(sourceDefinitionsJson.stream().map(j -> Jsons.object(j, StandardSourceDefinition.class)).toList());

IOs.writeFile(outputRoot.resolve(outputFileName), Jsons.toPrettyString(Jsons.jsonNode(combinedCatalog)));
}

private List<JsonNode> getSeedJson(final Path root, final String fileName) {
final String jsonString = IOs.readFile(root, fileName);
return MoreIterators.toList(Yamls.deserialize(jsonString).elements());
}

/**
* Updates all connector definitions with provided specs.
*
* @param definitions - List of Source or Destination Definitions as generated in the seed files
* @param specs - List of connector specs as generated in the seed files (see
* {@link DockerImageSpec})
*/
@VisibleForTesting
void mergeSpecsIntoDefinitions(final List<JsonNode> definitions, final List<JsonNode> specs, final ConfigSchema configSchema) {
final Map<String, JsonNode> specsByImage = specs.stream().collect(Collectors.toMap(
json -> json.get("dockerImage").asText(),
json -> json.get("spec")));

for (final JsonNode definition : definitions) {
final String dockerImage = DockerUtils.getTaggedImageName(
definition.get("dockerRepository").asText(),
definition.get("dockerImageTag").asText());
final JsonNode specConfigJson = specsByImage.get(dockerImage);

if (specConfigJson == null) {
throw new UnsupportedOperationException(String.format("A spec for docker image %s was not found", dockerImage));
}

((ObjectNode) definition).set("spec", specConfigJson);

if (!definition.hasNonNull("public")) {
// All definitions in the catalog are public by default
((ObjectNode) definition).set("public", BooleanNode.TRUE);
}

AirbyteConfigValidator.AIRBYTE_CONFIG_VALIDATOR.ensureAsRuntime(configSchema, definition);
}

}

}
Original file line number Diff line number Diff line change
@@ -0,0 +1,122 @@
/*
* Copyright (c) 2022 Airbyte, Inc., all rights reserved.
*/

package io.airbyte.config.specs;

import static org.junit.jupiter.api.Assertions.assertEquals;
import static org.junit.jupiter.api.Assertions.assertThrows;

import com.fasterxml.jackson.databind.JsonNode;
import com.google.common.collect.ImmutableMap;
import io.airbyte.commons.json.Jsons;
import io.airbyte.config.ConfigSchema;
import io.airbyte.config.DockerImageSpec;
import io.airbyte.config.StandardDestinationDefinition;
import io.airbyte.protocol.models.ConnectorSpecification;
import java.util.List;
import java.util.UUID;
import org.junit.jupiter.api.BeforeEach;
import org.junit.jupiter.api.Test;

class CombinedConnectorCatalogGeneratorTest {

private static final UUID DEF_ID1 = UUID.randomUUID();
private static final UUID DEF_ID2 = UUID.randomUUID();
private static final String CONNECTOR_NAME1 = "connector1";
private static final String CONNECTOR_NAME2 = "connector2";
private static final String DOCUMENTATION_URL = "https://www.example.com";
private static final String DOCKER_REPOSITORY1 = "airbyte/connector1";
private static final String DOCKER_REPOSITORY2 = "airbyte/connector2";
private static final String DOCKER_TAG1 = "0.1.0";
private static final String DOCKER_TAG2 = "0.2.0";

private CombinedConnectorCatalogGenerator catalogGenerator;

@BeforeEach
void setup() {
catalogGenerator = new CombinedConnectorCatalogGenerator();
}

@Test
void testMergeSpecsIntoDefinitions() {
final StandardDestinationDefinition destinationDefinition1 = new StandardDestinationDefinition()
.withDestinationDefinitionId(DEF_ID1)
.withDockerRepository(DOCKER_REPOSITORY1)
.withDockerImageTag(DOCKER_TAG1)
.withName(CONNECTOR_NAME1)
.withDocumentationUrl(DOCUMENTATION_URL)
.withSpec(new ConnectorSpecification());
final StandardDestinationDefinition destinationDefinition2 = new StandardDestinationDefinition()
.withDestinationDefinitionId(DEF_ID2)
.withDockerRepository(DOCKER_REPOSITORY2)
.withDockerImageTag(DOCKER_TAG2)
.withName(CONNECTOR_NAME2)
.withDocumentationUrl(DOCUMENTATION_URL)
.withSpec(new ConnectorSpecification());
final DockerImageSpec destinationSpec1 = new DockerImageSpec().withDockerImage(DOCKER_REPOSITORY1 + ":" + DOCKER_TAG1)
.withSpec(new ConnectorSpecification().withConnectionSpecification(Jsons.jsonNode(ImmutableMap.of(
"foo1",
"bar1"))));
final DockerImageSpec destinationSpec2 = new DockerImageSpec().withDockerImage(DOCKER_REPOSITORY2 + ":" + DOCKER_TAG2)
.withSpec(new ConnectorSpecification().withConnectionSpecification(Jsons.jsonNode(ImmutableMap.of(
"foo2",
"bar2"))));

final List<JsonNode> definitions = List.of(Jsons.jsonNode(destinationDefinition1), Jsons.jsonNode(destinationDefinition2));
final List<JsonNode> specs = List.of(Jsons.jsonNode(destinationSpec1), Jsons.jsonNode(destinationSpec2));

catalogGenerator.mergeSpecsIntoDefinitions(definitions, specs, ConfigSchema.STANDARD_DESTINATION_DEFINITION);

final StandardDestinationDefinition expectedDefinition1 = new StandardDestinationDefinition()
.withDestinationDefinitionId(DEF_ID1)
.withDockerRepository(DOCKER_REPOSITORY1)
.withDockerImageTag(DOCKER_TAG1)
.withName(CONNECTOR_NAME1)
.withDocumentationUrl(DOCUMENTATION_URL)
.withSpec(destinationSpec1.getSpec());

final StandardDestinationDefinition expectedDefinition2 = new StandardDestinationDefinition()
.withDestinationDefinitionId(DEF_ID2)
.withDockerRepository(DOCKER_REPOSITORY2)
.withDockerImageTag(DOCKER_TAG2)
.withName(CONNECTOR_NAME2)
.withDocumentationUrl(DOCUMENTATION_URL)
.withSpec(destinationSpec2.getSpec());

assertEquals(Jsons.jsonNode(expectedDefinition1), definitions.get(0));
assertEquals(Jsons.jsonNode(expectedDefinition2), definitions.get(1));
}

@Test
void testMergeSpecsIntoDefinitionsThrowsOnMissingSpec() {
final StandardDestinationDefinition destinationDefinition1 = new StandardDestinationDefinition()
.withDestinationDefinitionId(DEF_ID1)
.withDockerRepository(DOCKER_REPOSITORY1)
.withDockerImageTag(DOCKER_TAG1)
.withName(CONNECTOR_NAME1)
.withDocumentationUrl(DOCUMENTATION_URL)
.withSpec(new ConnectorSpecification());
final List<JsonNode> definitions = List.of(Jsons.jsonNode(destinationDefinition1));
final List<JsonNode> specs = List.of();

assertThrows(UnsupportedOperationException.class,
() -> catalogGenerator.mergeSpecsIntoDefinitions(definitions, specs, ConfigSchema.STANDARD_DESTINATION_DEFINITION));
}

@Test
void testMergeSpecsIntoDefinitionsThrowsOnInvalidFormat() {
final JsonNode invalidDefinition = Jsons.jsonNode(ImmutableMap.of("dockerRepository", DOCKER_REPOSITORY1, "dockerImageTag", DOCKER_TAG1));
final DockerImageSpec destinationSpec = new DockerImageSpec().withDockerImage(DOCKER_REPOSITORY1 + ":" + DOCKER_TAG1)
.withSpec(new ConnectorSpecification().withConnectionSpecification(Jsons.jsonNode(ImmutableMap.of(
"foo1",
"bar1"))));

final List<JsonNode> definitions = List.of(Jsons.jsonNode(invalidDefinition));
final List<JsonNode> specs = List.of(Jsons.jsonNode(destinationSpec));

assertThrows(RuntimeException.class,
() -> catalogGenerator.mergeSpecsIntoDefinitions(definitions, specs, ConfigSchema.STANDARD_DESTINATION_DEFINITION));
}

}
1 change: 1 addition & 0 deletions build.gradle
Original file line number Diff line number Diff line change
Expand Up @@ -121,6 +121,7 @@ def createSpotlessTarget = { pattern ->
'secrets',
'charts', // Helm charts often have injected template strings that will fail general linting. Helm linting is done separately.
'resources/seed/*_specs.yaml', // Do not remove - this is necessary to prevent diffs in our github workflows, as the file diff check runs between the Format step and the Build step, the latter of which generates the file.
'resources/seed/*_catalog.json', // Do not remove - this is also necessary to prevent diffs in our github workflows
'airbyte-integrations/connectors/source-amplitude/unit_tests/api_data/zipped.json', // Zipped file presents as non-UTF-8 making spotless sad
'airbyte-webapp', // The webapp module uses its own auto-formatter, so spotless is not necessary here
'airbyte-webapp-e2e-tests', // This module also uses its own auto-formatter
Expand Down

0 comments on commit bf43f62

Please sign in to comment.