Add Zipkin Dependencies support for OpenSearch storage
Signed-off-by: Andriy Redko <[email protected]>
reta committed May 11, 2024
1 parent 8e8ea60 commit 531842f
Showing 11 changed files with 769 additions and 0 deletions.
71 changes: 71 additions & 0 deletions opensearch/pom.xml
@@ -0,0 +1,71 @@
<?xml version="1.0" encoding="UTF-8"?>
<!--
Copyright The OpenZipkin Authors
SPDX-License-Identifier: Apache-2.0
-->
<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
<modelVersion>4.0.0</modelVersion>

<parent>
<groupId>io.zipkin.dependencies</groupId>
<artifactId>zipkin-dependencies-parent</artifactId>
<version>3.2.0-SNAPSHOT</version>
</parent>

<artifactId>zipkin-dependencies-opensearch</artifactId>
<name>Zipkin Dependencies: OpenSearch</name>

<properties>
<main.basedir>${project.basedir}/..</main.basedir>
<okhttp.version>4.12.0</okhttp.version>
</properties>

<dependencies>
<dependency>
<groupId>org.opensearch.client</groupId>
<artifactId>opensearch-spark-30_${scala.binary.version}</artifactId>
<version>${opensearch-spark.version}</version>
</dependency>

<dependency>
<groupId>io.zipkin.zipkin2</groupId>
<artifactId>zipkin-storage-elasticsearch</artifactId>
<version>${zipkin.version}</version>
<scope>test</scope>
</dependency>
<dependency>
<groupId>com.squareup.okhttp3</groupId>
<artifactId>mockwebserver</artifactId>
<version>${okhttp.version}</version>
<scope>test</scope>
</dependency>
<dependency>
<groupId>com.squareup.okhttp3</groupId>
<artifactId>okhttp-tls</artifactId>
<version>${okhttp.version}</version>
<scope>test</scope>
</dependency>
<!-- Temporarily override the ES version of SLF4J -->
<dependency>
<groupId>org.slf4j</groupId>
<artifactId>slf4j-api</artifactId>
<version>${slf4j.version}</version>
</dependency>

<!-- integration tests -->
<dependency>
<groupId>com.linecorp.armeria</groupId>
<artifactId>armeria-junit5</artifactId>
<version>${armeria.version}</version>
<scope>test</scope>
</dependency>
<dependency>
<groupId>org.testcontainers</groupId>
<artifactId>junit-jupiter</artifactId>
<version>${testcontainers.version}</version>
<scope>test</scope>
</dependency>
</dependencies>
</project>
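
The Testcontainers and Armeria test dependencies above back the integration tests. As a rough illustration only, the sketch below shows one way such a test could start a single-node OpenSearch with Testcontainers; the image tag, environment flags, and class name are assumptions, not part of this commit.

import org.junit.jupiter.api.Test;
import org.testcontainers.containers.GenericContainer;
import org.testcontainers.junit.jupiter.Container;
import org.testcontainers.junit.jupiter.Testcontainers;
import org.testcontainers.utility.DockerImageName;

@Testcontainers
class OpensearchContainerSketch {
  // Hypothetical single-node OpenSearch with the security plugin disabled, so the
  // job can reach it over plain HTTP on the mapped port.
  @Container
  static final GenericContainer<?> OPENSEARCH =
      new GenericContainer<>(DockerImageName.parse("opensearchproject/opensearch:2.11.1"))
          .withEnv("discovery.type", "single-node")
          .withEnv("DISABLE_SECURITY_PLUGIN", "true")
          .withExposedPorts(9200);

  @Test void containerStarts() {
    // This address could then be passed as the "hosts" value of the dependencies job.
    String hosts = "http://" + OPENSEARCH.getHost() + ":" + OPENSEARCH.getMappedPort(9200);
    System.out.println("OpenSearch reachable at " + hosts);
  }
}
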
273 changes: 273 additions & 0 deletions opensearch/src/main/java/zipkin2/dependencies/opensearch/OpensearchDependenciesJob.java
@@ -0,0 +1,273 @@
/*
* Copyright The OpenZipkin Authors
* SPDX-License-Identifier: Apache-2.0
*/
package zipkin2.dependencies.opensearch;

import com.google.gson.stream.JsonReader;
import com.google.gson.stream.MalformedJsonException;
import java.io.IOException;
import java.io.StringReader;
import java.net.URI;
import java.nio.charset.Charset;
import java.text.SimpleDateFormat;
import java.util.Collections;
import java.util.Date;
import java.util.LinkedHashMap;
import java.util.Map;
import java.util.TimeZone;
import javax.annotation.Nullable;
import org.apache.spark.SparkConf;
import org.apache.spark.api.java.JavaRDD;
import org.apache.spark.api.java.JavaSparkContext;
import org.apache.spark.api.java.function.Function;
import org.apache.spark.api.java.function.PairFunction;
import org.opensearch.spark.rdd.api.java.JavaOpenSearchSpark;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import scala.Tuple2;
import zipkin2.DependencyLink;
import zipkin2.codec.SpanBytesDecoder;

import static com.google.common.base.Preconditions.checkNotNull;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_INDEX_READ_MISSING_AS_EMPTY;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NET_HTTP_AUTH_PASS;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NET_HTTP_AUTH_USER;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NET_SSL_KEYSTORE_LOCATION;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NET_SSL_KEYSTORE_PASS;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NET_SSL_TRUST_STORE_LOCATION;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NET_SSL_TRUST_STORE_PASS;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NET_USE_SSL;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NODES;
import static org.opensearch.hadoop.cfg.ConfigurationOptions.OPENSEARCH_NODES_WAN_ONLY;
import static zipkin2.internal.DateUtil.midnightUTC;

public final class OpensearchDependenciesJob {
static final Charset UTF_8 = Charset.forName("UTF-8");

private static final Logger log = LoggerFactory.getLogger(OpensearchDependenciesJob.class);

public static Builder builder() {
return new Builder();
}

public static final class Builder {

String index = getEnv("ES_INDEX", "zipkin");
String hosts = getEnv("ES_HOSTS", "127.0.0.1");
String username = getEnv("ES_USERNAME", null);
String password = getEnv("ES_PASSWORD", null);

final Map<String, String> sparkProperties = new LinkedHashMap<>();

Builder() {
sparkProperties.put("spark.ui.enabled", "false");
// don't die if there are no spans
sparkProperties.put(OPENSEARCH_INDEX_READ_MISSING_AS_EMPTY, "true");
sparkProperties.put(OPENSEARCH_NODES_WAN_ONLY, getEnv("ES_NODES_WAN_ONLY", "false"));
sparkProperties.put(OPENSEARCH_NET_SSL_KEYSTORE_LOCATION,
getSystemPropertyAsFileResource("javax.net.ssl.keyStore"));
sparkProperties.put(OPENSEARCH_NET_SSL_KEYSTORE_PASS,
System.getProperty("javax.net.ssl.keyStorePassword", ""));
sparkProperties.put(OPENSEARCH_NET_SSL_TRUST_STORE_LOCATION,
getSystemPropertyAsFileResource("javax.net.ssl.trustStore"));
sparkProperties.put(OPENSEARCH_NET_SSL_TRUST_STORE_PASS,
System.getProperty("javax.net.ssl.trustStorePassword", ""));
}

// local[*] master lets us run & test the job locally without setting up a Spark cluster
String sparkMaster = getEnv("SPARK_MASTER", "local[*]");
// needed when not in local mode
String[] jars;
Runnable logInitializer;

// By default, the job only works on traces whose first timestamp is today
long day = midnightUTC(System.currentTimeMillis());

/** When set, this indicates which jars to distribute to the cluster. */
public Builder jars(String... jars) {
this.jars = jars;
return this;
}

/** The index prefix to use when generating daily index names. Defaults to "zipkin" */
public Builder index(String index) {
this.index = checkNotNull(index, "index");
return this;
}

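/**
 * Comma-separated OpenSearch node URLs or host:port pairs. Setting this also enables WAN-only
 * mode, meaning only the listed nodes are used (no node discovery).
 */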
public Builder hosts(String hosts) {
this.hosts = checkNotNull(hosts, "hosts");
sparkProperties.put("opensearch.nodes.wan.only", "true");
return this;
}

/** username used for basic auth. Needed when the OpenSearch security plugin is enabled */
public Builder username(String username) {
this.username = username;
return this;
}

/** password used for basic auth. Needed when the OpenSearch security plugin is enabled */
public Builder password(String password) {
this.password = password;
return this;
}

/** Day (in epoch milliseconds) to process dependencies for. Defaults to today. */
public Builder day(long day) {
this.day = midnightUTC(day);
return this;
}

/** Adds additional Spark configuration properties. */
public Builder conf(Map<String, String> conf) {
sparkProperties.putAll(conf);
return this;
}

/** Ensures that logging is set up. Particularly important when in cluster mode. */
public Builder logInitializer(Runnable logInitializer) {
this.logInitializer = checkNotNull(logInitializer, "logInitializer");
return this;
}

public OpensearchDependenciesJob build() {
return new OpensearchDependenciesJob(this);
}
}

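/**
 * Reads a keystore/truststore path from the given system property and prefixes it with "file:"
 * so the opensearch-hadoop connector loads it as a file resource; empty when the property is unset.
 */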
private static String getSystemPropertyAsFileResource(String key) {
String prop = System.getProperty(key, "");
return prop != null && !prop.isEmpty() ? "file:" + prop : prop;
}

final String index;
final String dateStamp;
final SparkConf conf;
@Nullable final Runnable logInitializer;

OpensearchDependenciesJob(Builder builder) {
this.index = builder.index;
String dateSeparator = getEnv("ES_DATE_SEPARATOR", "-");
SimpleDateFormat df = new SimpleDateFormat("yyyy-MM-dd".replace("-", dateSeparator));
df.setTimeZone(TimeZone.getTimeZone("UTC"));
this.dateStamp = df.format(new Date(builder.day));
this.conf = new SparkConf(true).setMaster(builder.sparkMaster).setAppName(getClass().getName());
if (builder.sparkMaster.startsWith("local[")) {
conf.set("spark.driver.bindAddress", "127.0.0.1");
}
if (builder.jars != null) conf.setJars(builder.jars);
if (builder.username != null) conf.set(OPENSEARCH_NET_HTTP_AUTH_USER, builder.username);
if (builder.password != null) conf.set(OPENSEARCH_NET_HTTP_AUTH_PASS, builder.password);
conf.set(OPENSEARCH_NODES, parseHosts(builder.hosts));
if (builder.hosts.contains("https")) conf.set(OPENSEARCH_NET_USE_SSL, "true");
for (Map.Entry<String, String> entry : builder.sparkProperties.entrySet()) {
conf.set(entry.getKey(), entry.getValue());
log.debug("Spark conf properties: {}={}", entry.getKey(), entry.getValue());
}
this.logInitializer = builder.logInitializer;
}

public void run() {
String spanResource = index + "-span-" + dateStamp;
String dependencyLinkResource = index + "-dependency-" + dateStamp;
SpanBytesDecoder decoder = SpanBytesDecoder.JSON_V2;

log.info("Processing spans from {}", spanResource);
JavaRDD<Map<String, Object>> links;
try (JavaSparkContext sc = new JavaSparkContext(conf)) {
links = JavaOpenSearchSpark.openSearchJsonRDD(sc, spanResource)
.groupBy(JSON_TRACE_ID)
.flatMapValues(new TraceIdAndJsonToDependencyLinks(logInitializer, decoder))
.values()
.mapToPair((PairFunction<DependencyLink, Tuple2<String, String>, DependencyLink>) l ->
new Tuple2<>(new Tuple2<>(l.parent(), l.child()), l))
.reduceByKey((l, r) -> DependencyLink.newBuilder()
.parent(l.parent())
.child(l.child())
.callCount(l.callCount() + r.callCount())
.errorCount(l.errorCount() + r.errorCount())
.build())
.values()
.map(DEPENDENCY_LINK_JSON);

if (links.isEmpty()) {
log.info("No dependency links could be processed from spans in index {}", spanResource);
} else {
log.info("Saving dependency links to {}", dependencyLinkResource);
JavaOpenSearchSpark.saveToOpenSearch(
links,
dependencyLinkResource,
Collections.singletonMap("opensearch.mapping.id", "id")); // allows overwriting the link
}
}

log.info("Done");
}

/**
* Same as {@linkplain DependencyLink}, except it adds an ID field so the job can be re-run,
* overwriting a prior run's value for the link.
*/
static final Function<DependencyLink, Map<String, Object>> DEPENDENCY_LINK_JSON = l -> {
Map<String, Object> result = new LinkedHashMap<>();
result.put("id", l.parent() + "|" + l.child());
result.put("parent", l.parent());
result.put("child", l.child());
result.put("callCount", l.callCount());
result.put("errorCount", l.errorCount());
return result;
};

private static String getEnv(String key, String defaultValue) {
String result = System.getenv(key);
return result != null && !result.isEmpty() ? result : defaultValue;
}

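/**
 * Normalizes a comma-separated host list into the host:port form the connector expects, e.g.
 * "https://opensearch.example.com,other:9200" becomes "opensearch.example.com:443,other:9200".
 */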
static String parseHosts(String hosts) {
StringBuilder to = new StringBuilder();
String[] hostParts = hosts.split(",", -1);
for (int i = 0; i < hostParts.length; i++) {
String host = hostParts[i];
if (host.startsWith("http")) {
URI httpUri = URI.create(host);
int port = httpUri.getPort();
if (port == -1) {
port = host.startsWith("https") ? 443 : 80;
}
to.append(httpUri.getHost()).append(":").append(port);
} else {
to.append(host);
}
if (i + 1 < hostParts.length) {
to.append(',');
}
}
return to.toString();
}

// Kept as an anonymous class rather than a lambda so it can override toString for debugging.
static final Function<Tuple2<String, String>, String> JSON_TRACE_ID =
new Function<Tuple2<String, String>, String>() {
/** returns the lower 64 bits of the trace ID */
@Override public String call(Tuple2<String, String> pair) throws IOException {
JsonReader reader = new JsonReader(new StringReader(pair._2));
reader.beginObject();
while (reader.hasNext()) {
String nextName = reader.nextName();
if (nextName.equals("traceId")) {
String traceId = reader.nextString();
return traceId.length() > 16 ? traceId.substring(traceId.length() - 16) : traceId;
} else {
reader.skipValue();
}
}
throw new MalformedJsonException("no traceId in " + pair);
}

@Override public String toString() {
return "pair._2.traceId";
}
};
}
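
For orientation, here is a minimal sketch (not part of the commit) of how the job above is typically wired up; the host, index, and day values are illustrative assumptions, while the builder methods are the ones defined in this file.

import zipkin2.dependencies.opensearch.OpensearchDependenciesJob;

public final class RunJobSketch {
  public static void main(String[] args) {
    OpensearchDependenciesJob.builder()
        .hosts("http://127.0.0.1:9200")  // or export ES_HOSTS
        .index("zipkin")                 // daily index prefix; "zipkin" is the default
        .day(System.currentTimeMillis()) // normalized to midnight UTC by the builder
        .build()
        .run();                          // reads *-span-<date>, writes *-dependency-<date>
  }
}
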
49 changes: 49 additions & 0 deletions opensearch/src/main/java/zipkin2/dependencies/opensearch/TraceIdAndJsonToDependencyLinks.java
@@ -0,0 +1,49 @@
/*
* Copyright The OpenZipkin Authors
* SPDX-License-Identifier: Apache-2.0
*/
package zipkin2.dependencies.opensearch;

import java.io.Serializable;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;
import javax.annotation.Nullable;
import org.apache.spark.api.java.function.FlatMapFunction;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import scala.Tuple2;
import zipkin2.DependencyLink;
import zipkin2.Span;
import zipkin2.codec.SpanBytesDecoder;
import zipkin2.internal.DependencyLinker;

final class TraceIdAndJsonToDependencyLinks
implements Serializable, FlatMapFunction<Iterable<Tuple2<String, String>>, DependencyLink> {
private static final long serialVersionUID = 0L;
private static final Logger log = LoggerFactory.getLogger(TraceIdAndJsonToDependencyLinks.class);

@Nullable final Runnable logInitializer;
final SpanBytesDecoder decoder;

TraceIdAndJsonToDependencyLinks(Runnable logInitializer, SpanBytesDecoder decoder) {
this.logInitializer = logInitializer;
this.decoder = decoder;
}

@Override
public Iterator<DependencyLink> call(Iterable<Tuple2<String, String>> traceIdJson) {
if (logInitializer != null) logInitializer.run();
List<Span> sameTraceId = new ArrayList<>();
for (Tuple2<String, String> row : traceIdJson) {
try {
decoder.decode(row._2.getBytes(OpensearchDependenciesJob.UTF_8), sameTraceId);
} catch (Exception e) {
log.warn("Unable to decode span from traces where trace_id=" + row._1, e);
}
}
DependencyLinker linker = new DependencyLinker();
linker.putTrace(sameTraceId);
return linker.link().iterator();
}
}
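
To make the linking step concrete, the following sketch (not part of the commit) shows what DependencyLinker produces for one decoded trace; the span values are invented for illustration.

import java.util.Arrays;
import java.util.List;
import zipkin2.DependencyLink;
import zipkin2.Endpoint;
import zipkin2.Span;
import zipkin2.internal.DependencyLinker;

class DependencyLinkerSketch {
  public static void main(String[] args) {
    // Two spans of the same trace: a client call from "frontend" and the matching server span in "backend".
    Span client = Span.newBuilder()
        .traceId("86154a4ba6e91385").id("216a2aea45d08fc9")
        .kind(Span.Kind.CLIENT).name("get")
        .localEndpoint(Endpoint.newBuilder().serviceName("frontend").build())
        .build();
    Span server = Span.newBuilder()
        .traceId("86154a4ba6e91385").parentId("216a2aea45d08fc9").id("5b4185666d50f68b")
        .kind(Span.Kind.SERVER).name("get")
        .localEndpoint(Endpoint.newBuilder().serviceName("backend").build())
        .build();

    DependencyLinker linker = new DependencyLinker();
    linker.putTrace(Arrays.asList(client, server));
    List<DependencyLink> links = linker.link();
    System.out.println(links); // expect one link: frontend -> backend, callCount=1
  }
}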