Skip to content

Commit

Permalink
introduce proto
Browse files Browse the repository at this point in the history
  • Loading branch information
wenfengwang committed Aug 26, 2022
1 parent 6967005 commit ee09df1
Show file tree
Hide file tree
Showing 19 changed files with 360 additions and 293 deletions.
File renamed without changes.
File renamed without changes.
File renamed without changes.
File renamed without changes.
Original file line number Diff line number Diff line change
Expand Up @@ -6,14 +6,17 @@
<groupId>com.linkall</groupId>
<modelVersion>4.0.0</modelVersion>
<version>0.1.0-SNAPSHOT</version>
<artifactId>connector-mongodb</artifactId>
<artifactId>mongodb-source</artifactId>

<properties>
<maven.compiler.source>8</maven.compiler.source>
<maven.compiler.target>8</maven.compiler.target>
<debezium.version>1.9.4.Final</debezium.version>
<junit-jupiter.version>5.5.2</junit-jupiter.version>
<fastjson.version>1.2.83</fastjson.version>
<grpc.version>1.49.0</grpc.version>
<google.proto.version>3.21.5</google.proto.version>
<apache.commons.version>1.9</apache.commons.version>
</properties>
<dependencies>
<dependency>
Expand Down Expand Up @@ -45,11 +48,61 @@
<dependency>
<groupId>org.apache.commons</groupId>
<artifactId>commons-text</artifactId>
<version>1.9</version>
<version>${apache.commons.version}</version>
</dependency>
<dependency>
<groupId>io.grpc</groupId>
<artifactId>grpc-protobuf</artifactId>
<version>${grpc.version}</version>
</dependency>
<dependency>
<groupId>io.grpc</groupId>
<artifactId>grpc-stub</artifactId>
<version>${grpc.version}</version>
</dependency>
<dependency>
<groupId>com.google.protobuf</groupId>
<artifactId>protobuf-java</artifactId>
<version>${google.proto.version}</version>
</dependency>
<dependency>
<groupId>com.google.protobuf</groupId>
<artifactId>protobuf-java-util</artifactId>
<version>${google.proto.version}</version>
</dependency>
</dependencies>
<build>
<extensions>
<extension>
<groupId>kr.motd.maven</groupId>
<artifactId>os-maven-plugin</artifactId>
<version>1.6.0</version>
</extension>
</extensions>
<plugins>
<!-- Generates Java sources from the shared .proto schemas during the build. -->
<plugin>
<groupId>org.xolstice.maven.plugins</groupId>
<artifactId>protobuf-maven-plugin</artifactId>
<version>0.6.1</version>
<extensions>true</extensions>
<executions>
<execution>
<goals>
<!-- Run protoc for both main and test source sets. -->
<goal>compile</goal>
<goal>test-compile</goal>
</goals>
</execution>
</executions>
<configuration>
<!-- Schemas live outside this module, two directories up. -->
<protoSourceRoot>../../schemas</protoSourceRoot>
<!-- Only these three schema files are compiled. -->
<includes>
<include>database/database.proto</include>
<include>database/mongodb.proto</include>
<include>base/base.proto</include>
</includes>
<!-- ${os.detected.classifier} is expected to be provided by the os-maven-plugin build extension. -->
<!-- NOTE(review): protoc is pinned to 3.7.0 while protobuf-java uses ${google.proto.version}; confirm the version gap is intended. -->
<protocArtifact>com.google.protobuf:protoc:3.7.0:exe:${os.detected.classifier}</protocArtifact>
</configuration>
</plugin>
<plugin>
<groupId>org.apache.maven.plugins</groupId>
<artifactId>maven-assembly-plugin</artifactId>
Expand All @@ -63,7 +116,7 @@
<archive>
<manifest>
<mainClass>
com.linkall.source.mysql.Entrance
com.linkall.source.mongo.Entrance
</mainClass>
</manifest>
</archive>
Expand Down
File renamed without changes.
Original file line number Diff line number Diff line change
@@ -0,0 +1,172 @@
// Copyright 2022 Linkall Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package com.linkall.connector.mongodb;

import com.alibaba.fastjson.JSON;
import com.alibaba.fastjson.JSONObject;
import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.protobuf.Struct;
import com.google.protobuf.Value;
import com.google.protobuf.util.JsonFormat;
import com.linkall.connector.proto.Base;
import com.linkall.connector.proto.Database;
import com.linkall.connector.proto.Mongodb;
import com.linkall.vance.core.Adapter2;
import io.cloudevents.CloudEvent;
import io.cloudevents.core.builder.CloudEventBuilder;
import io.cloudevents.jackson.JsonCloudEventData;
import org.apache.commons.text.StringEscapeUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.net.URI;
import java.nio.charset.StandardCharsets;
import java.time.Instant;
import java.time.OffsetDateTime;
import java.time.ZoneOffset;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;

/**
 * Adapter that turns a MongoDB change record, supplied as a JSON key string and a JSON value
 * string, into a {@link CloudEvent}.
 *
 * <p>The conversion has two stages: {@link #parse(String, String)} builds a
 * {@code Mongodb.Event} protobuf message from the raw strings, and
 * {@link #proto2CloudEvent(Mongodb.Event)} wraps that message in a CloudEvent.
 */
public class MongoDBAdapter implements Adapter2 {
    private static final Logger LOGGER = LoggerFactory.getLogger(MongoDBAdapter.class);
    private static final String EXTENSION_NAME_PREFIX = "vancemongodb";
    // Shared mapper: avoids allocating a new ObjectMapper for every converted event.
    private static final ObjectMapper MAPPER = new ObjectMapper();
    // Metadata keys that are NOT copied into "vancemongodb*" extension attributes.
    private static final List<String> keyFilter = new ArrayList<>();

    static {
        keyFilter.add("db");
        keyFilter.add("collection");
        keyFilter.add("connector");
        keyFilter.add("rs");
        keyFilter.add("ts_ms");
    }

    /**
     * Parses a raw change record into a {@code Mongodb.Event}.
     *
     * <p>The raw key and value are always stored on the returned event. The event's metadata is
     * flagged {@code recognized = false} when the key has no {@code "id"} entry, when the
     * {@code "op"} field is not one of {@code "u"}, {@code "c"} or {@code "d"}, or when any
     * exception is raised while parsing. This method does not throw for such failures; it logs
     * a warning and returns whatever was populated up to that point.
     *
     * @param key   JSON text of the record key; the document id is read from {@code id.$oid}
     * @param value JSON text of the record value; {@code source}, {@code op},
     *              {@code updateDescription} and {@code after} are read from it
     * @return the built event, never {@code null}
     */
    public static Mongodb.Event parse(String key, String value) {
        Mongodb.Event.Builder builder = Mongodb.Event.newBuilder();
        builder.getMetadataBuilder().setRecognized(true);
        builder.getRawBuilder().setKey(key);
        builder.getRawBuilder().setValue(value);
        try {
            JSONObject obj = JSON.parseObject(value);
            Base.Metadata.Builder mdBuilder = builder.getMetadataBuilder();

            // The whole "source" object becomes the metadata extension struct.
            Struct.Builder sb = Struct.newBuilder();
            JsonFormat.parser().merge(obj.getJSONObject("source").toJSONString(), sb);
            mdBuilder.setExtension(sb.build());

            JSONObject id = JSON.parseObject(key);
            if (!id.containsKey("id")) {
                mdBuilder.setRecognized(false);
                return builder.build();
            }
            mdBuilder.setId(id.getJSONObject("id").get("$oid").toString());

            switch (obj.getString("op")) {
                case "u":
                    builder.setOp(Database.Operation.UPDATE);
                    // A missing "updateDescription" makes the calls below throw; the catch
                    // block at the end of this method then marks the event unrecognized.
                    JSONObject ud = obj.getJSONObject("updateDescription");

                    JsonFormat.parser().merge(
                            StringEscapeUtils.unescapeJava(
                                    ud.getOrDefault("updatedFields", "{}").toString()),
                            builder.getUpdateBuilder().getUpdateDescriptionBuilder()
                                    .getUpdatedFieldsBuilder());
                    JsonFormat.parser().merge(
                            StringEscapeUtils.unescapeJava(
                                    ud.getOrDefault("truncatedArrays", "[]").toString()),
                            builder.getUpdateBuilder().getUpdateDescriptionBuilder()
                                    .getTruncatedArraysBuilder());
                    JsonFormat.parser().merge(
                            StringEscapeUtils.unescapeJava(
                                    ud.getOrDefault("removedFields", "[]").toString()),
                            builder.getUpdateBuilder().getUpdateDescriptionBuilder()
                                    .getRemovedFieldsBuilder());
                    // Intentional fall-through: an update also carries the "after" document,
                    // which is stored through the same code path as an insert.
                case "c":
                    // Only a genuine create reaches here with the op still UNKNOWN.
                    if (builder.getOp() == Database.Operation.UNKNOWN) {
                        builder.setOp(Database.Operation.INSERT);
                    }
                    JsonFormat.parser().merge(obj.getString("after"),
                            builder.getInsertBuilder().getDocumentBuilder());
                    break;
                case "d":
                    builder.setOp(Database.Operation.DELETE);
                    break;
                default:
                    builder.setOp(Database.Operation.UNKNOWN);
                    mdBuilder.setRecognized(false);
                    return builder.build();
            }
        } catch (Exception e) {
            // Pass the throwable as the last argument so the stack trace is logged too.
            LOGGER.warn("parse event data failed: {}", e.getMessage(), e);
            builder.getMetadataBuilder().setRecognized(false);
        }
        return builder.build();
    }

    /**
     * Wraps a parsed {@code Mongodb.Event} in a CloudEvent.
     *
     * <p>Id, type and source start out as {@code "unknown"} placeholders and are replaced from
     * the event metadata only when the event is recognized. The event itself, printed as JSON,
     * becomes the CloudEvent data. If anything fails along the way, the data is replaced with a
     * JSON object of the form {@code {"raw":{"key":...,"value":...}}} holding the original
     * strings, and the failure is logged.
     *
     * @param event the parsed event
     * @return the CloudEvent; it always carries the {@code vancemongodbrecognized} extension
     */
    public static CloudEvent proto2CloudEvent(Mongodb.Event event) {
        CloudEventBuilder builder = CloudEventBuilder.v1();

        String id = "unknown";
        String sourcePrefix = "unknown.unknown";
        String type = "unknown.unknown";
        builder.withId(id).withType(type).withSource(URI.create(sourcePrefix + "." + type));
        try {
            builder.withDataContentType("application/json");
            Base.Metadata md = event.getMetadata();
            Map<String, Value> fields = md.getExtension().getFieldsMap();

            if (md.getRecognized()) {
                id = md.getId();
                sourcePrefix = fields.get("connector").getStringValue() + "."
                        + fields.get("rs").getStringValue();
                type = fields.get("db").getStringValue() + "."
                        + fields.get("collection").getStringValue();
                builder.withId(id).withType(type)
                        .withSource(URI.create(sourcePrefix + "." + type));
            }

            // "ts_ms" is used as epoch milliseconds for the event time.
            Value time = fields.get("ts_ms");
            if (time != null) {
                long epochMillis = (long) time.getNumberValue();
                builder.withTime(
                        OffsetDateTime.ofInstant(Instant.ofEpochMilli(epochMillis), ZoneOffset.UTC));
            }

            String data = JsonFormat.printer().omittingInsignificantWhitespace().print(event);
            builder.withData(JsonCloudEventData.wrap(MAPPER.readTree(data)));

            for (Map.Entry<String, Value> entry : fields.entrySet()) {
                if (!keyFilter.contains(entry.getKey()) && entry.getValue() != null) {
                    // NOTE(review): Value#toString() looks like it yields protobuf text format
                    // rather than the bare scalar - confirm this is the intended value.
                    builder.withExtension(
                            EXTENSION_NAME_PREFIX + entry.getKey(), entry.getValue().toString());
                }
            }

            builder.withExtension(EXTENSION_NAME_PREFIX + "operation", event.getOp().toString());
        } catch (Exception e) {
            LOGGER.warn("convert event to CloudEvent failed, falling back to raw payload: {}",
                    e.getMessage(), e);
            // Serialise through JSONObject so quotes and backslashes inside the raw key/value
            // are escaped; plain concatenation produced invalid JSON for such input.
            JSONObject raw = new JSONObject(true);
            raw.put("key", event.getRaw().getKey());
            raw.put("value", event.getRaw().getValue());
            JSONObject fallback = new JSONObject(true);
            fallback.put("raw", raw);
            // Trailing newline retained from the previous payload format.
            String data = fallback.toJSONString() + "\n";
            builder.withData(data.getBytes(StandardCharsets.UTF_8));
        }
        builder.withExtension(
                EXTENSION_NAME_PREFIX + "recognized", event.getMetadata().getRecognized());
        return builder.build();
    }

    /**
     * Converts one raw record into a CloudEvent by chaining {@link #parse(String, String)} and
     * {@link #proto2CloudEvent(Mongodb.Event)}.
     *
     * @param key record key; cast to {@link String}
     * @param val record value; cast to {@link String}
     * @return the resulting CloudEvent
     * @throws ClassCastException if {@code key} or {@code val} is a non-null object that is not
     *                            a {@link String}
     */
    @Override
    public CloudEvent adapt(Object key, Object val) {
        return MongoDBAdapter.proto2CloudEvent(MongoDBAdapter.parse((String) key, (String) val));
    }
}

Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,6 @@
import com.linkall.connector.mongodb.debezium.DebeziumSource;
import com.linkall.vance.core.Adapter;
import org.apache.logging.log4j.util.Strings;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import java.io.FileNotFoundException;
import java.io.IOException;
Expand Down
Loading

0 comments on commit ee09df1

Please sign in to comment.