Add cluster logging load test for GCL #36198

Merged · 2 commits · Feb 17, 2017
4 changes: 4 additions & 0 deletions Godeps/Godeps.json

35 changes: 35 additions & 0 deletions Godeps/LICENSES

6 changes: 5 additions & 1 deletion test/e2e/BUILD
@@ -16,7 +16,10 @@ go_library(
         "autoscaling_utils.go",
         "cadvisor.go",
         "cluster_logging_es.go",
+        "cluster_logging_es_utils.go",
         "cluster_logging_gcl.go",
+        "cluster_logging_gcl_load.go",
+        "cluster_logging_gcl_utils.go",
         "cluster_logging_utils.go",
         "cluster_size_autoscaling.go",
         "cluster_upgrade.go",
@@ -178,8 +181,10 @@ go_library(
         "//vendor:golang.org/x/crypto/ssh",
         "//vendor:golang.org/x/net/context",
         "//vendor:golang.org/x/net/websocket",
+        "//vendor:golang.org/x/oauth2/google",
         "//vendor:google.golang.org/api/compute/v1",
         "//vendor:google.golang.org/api/googleapi",
+        "//vendor:google.golang.org/api/logging/v2beta1",
         "//vendor:k8s.io/apimachinery/pkg/api/errors",
         "//vendor:k8s.io/apimachinery/pkg/api/resource",
         "//vendor:k8s.io/apimachinery/pkg/apis/meta/v1",
@@ -189,7 +194,6 @@ go_library(
         "//vendor:k8s.io/apimachinery/pkg/runtime/schema",
         "//vendor:k8s.io/apimachinery/pkg/types",
         "//vendor:k8s.io/apimachinery/pkg/util/intstr",
-        "//vendor:k8s.io/apimachinery/pkg/util/json",
         "//vendor:k8s.io/apimachinery/pkg/util/net",
         "//vendor:k8s.io/apimachinery/pkg/util/runtime",
         "//vendor:k8s.io/apimachinery/pkg/util/sets",
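
The two new vendor dependencies above (golang.org/x/oauth2/google and google.golang.org/api/logging/v2beta1) are what the new GCL logs provider presumably builds on. The provider itself lives in cluster_logging_gcl_utils.go, which is not rendered in this view; as rough orientation, reading entries back from Cloud Logging with these packages looks roughly like the sketch below. The function name readGclEntries, the project/filter parameters, and the pagination loop are illustrative assumptions, not code from this PR.

// Illustrative sketch only -- not the helper added by this PR.
package gclsketch

import (
    "fmt"

    "golang.org/x/net/context"
    "golang.org/x/oauth2/google"
    gcl "google.golang.org/api/logging/v2beta1"
)

// readGclEntries (hypothetical name) fetches all Cloud Logging entries
// in the given project that match the filter, following pagination.
func readGclEntries(projectID, filter string) ([]*gcl.LogEntry, error) {
    // Application Default Credentials, e.g. the GCE service account
    // the e2e cluster runs under.
    client, err := google.DefaultClient(context.Background(), gcl.CloudPlatformReadOnlyScope)
    if err != nil {
        return nil, fmt.Errorf("failed to get OAuth2 client: %v", err)
    }
    service, err := gcl.New(client)
    if err != nil {
        return nil, fmt.Errorf("failed to create Cloud Logging client: %v", err)
    }

    var entries []*gcl.LogEntry
    req := &gcl.ListLogEntriesRequest{
        ProjectIds: []string{projectID},
        Filter:     filter,
    }
    for {
        resp, err := service.Entries.List(req).Do()
        if err != nil {
            return nil, fmt.Errorf("failed to list log entries: %v", err)
        }
        entries = append(entries, resp.Entries...)
        if resp.NextPageToken == "" {
            return entries, nil
        }
        req.PageToken = resp.NextPageToken
    }
}
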
257 changes: 15 additions & 242 deletions test/e2e/cluster_logging_es.go
@@ -17,24 +17,13 @@ limitations under the License.
 package e2e

 import (
-    "context"
-    "encoding/json"
     "fmt"
-    "strconv"
-    "strings"
     "time"

-    metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
-    "k8s.io/apimachinery/pkg/labels"
+    meta_v1 "k8s.io/apimachinery/pkg/apis/meta/v1"
     "k8s.io/kubernetes/test/e2e/framework"

     . "github.com/onsi/ginkgo"
-    . "github.com/onsi/gomega"
 )

-const (
-    // graceTime is how long to keep retrying requesting elasticsearch for status information.
-    graceTime = 5 * time.Minute
-)
-
 var _ = framework.KubeDescribe("Cluster level logging using Elasticsearch [Feature:Elasticsearch]", func() {
@@ -48,241 +37,25 @@ var _ = framework.KubeDescribe("Cluster level logging using Elasticsearch [Feature:Elasticsearch]", func() {
     })

     It("should check that logs from containers are ingested into Elasticsearch", func() {
-        err := checkElasticsearchReadiness(f)
-        framework.ExpectNoError(err, "Elasticsearch failed to start")
+        podName := "synthlogger"
+        esLogsProvider, err := newEsLogsProvider(f)
+        framework.ExpectNoError(err, "Failed to create Elasticsearch logs provider")
+
+        err = esLogsProvider.EnsureWorking()
+        framework.ExpectNoError(err, "Elasticsearch is not working")

         By("Running synthetic logger")
-        createSynthLogger(f, expectedLinesCount)
-        defer f.PodClient().Delete(synthLoggerPodName, &metav1.DeleteOptions{})
-        err = framework.WaitForPodSuccessInNamespace(f.ClientSet, synthLoggerPodName, f.Namespace.Name)
-        framework.ExpectNoError(err, fmt.Sprintf("Should've successfully waited for pod %s to succeed", synthLoggerPodName))
+        pod := createLoggingPod(f, podName, 100, 1*time.Second)
+        defer f.PodClient().Delete(podName, &meta_v1.DeleteOptions{})
+        err = framework.WaitForPodSuccessInNamespace(f.ClientSet, podName, f.Namespace.Name)
+        framework.ExpectNoError(err, fmt.Sprintf("Should've successfully waited for pod %s to succeed", podName))

         By("Waiting for logs to ingest")
-        totalMissing := expectedLinesCount
-        for start := time.Now(); time.Since(start) < ingestionTimeout; time.Sleep(ingestionRetryDelay) {
-            totalMissing, err = getMissingLinesCountElasticsearch(f, expectedLinesCount)
-            if err != nil {
-                framework.Logf("Failed to get missing lines count due to %v", err)
-                totalMissing = expectedLinesCount
-            } else if totalMissing > 0 {
-                framework.Logf("Still missing %d lines", totalMissing)
-            }
+        err = waitForLogsIngestion(esLogsProvider, []*loggingPod{pod}, 10*time.Minute, 0)
+        framework.ExpectNoError(err, "Failed to ingest logs")

-            if totalMissing == 0 {
-                break
-            }
-        }
-
-        if totalMissing > 0 {
-            if err := reportLogsFromFluentdPod(f); err != nil {
-                framework.Logf("Failed to report logs from fluentd pod due to %v", err)
-            }
+        if err != nil {
+            reportLogsFromFluentdPod(f, pod)
         }
-
-        Expect(totalMissing).To(Equal(0), "Some log lines are still missing")
     })
 })

-// Ensures that Elasticsearch is running and ready to serve requests
-func checkElasticsearchReadiness(f *framework.Framework) error {
-    // Check for the existence of the Elasticsearch service.
-    By("Checking the Elasticsearch service exists.")
-    s := f.ClientSet.Core().Services(metav1.NamespaceSystem)
-    // Make a few attempts to connect. This makes the test robust against
-    // being run as the first e2e test just after the e2e cluster has been created.
-    var err error
-    for start := time.Now(); time.Since(start) < graceTime; time.Sleep(5 * time.Second) {
-        if _, err = s.Get("elasticsearch-logging", metav1.GetOptions{}); err == nil {
-            break
-        }
-        framework.Logf("Attempt to check for the existence of the Elasticsearch service failed after %v", time.Since(start))
-    }
-    Expect(err).NotTo(HaveOccurred())
-
-    // Wait for the Elasticsearch pods to enter the running state.
-    By("Checking to make sure the Elasticsearch pods are running")
-    label := labels.SelectorFromSet(labels.Set(map[string]string{"k8s-app": "elasticsearch-logging"}))
-    options := metav1.ListOptions{LabelSelector: label.String()}
-    pods, err := f.ClientSet.Core().Pods(metav1.NamespaceSystem).List(options)
-    Expect(err).NotTo(HaveOccurred())
-    for _, pod := range pods.Items {
-        err = framework.WaitForPodRunningInNamespace(f.ClientSet, &pod)
-        Expect(err).NotTo(HaveOccurred())
-    }
-
-    By("Checking to make sure we are talking to an Elasticsearch service.")
-    // Perform a few checks to make sure this looks like an Elasticsearch cluster.
-    var statusCode int
-    err = nil
-    var body []byte
-    for start := time.Now(); time.Since(start) < graceTime; time.Sleep(10 * time.Second) {
-        proxyRequest, errProxy := framework.GetServicesProxyRequest(f.ClientSet, f.ClientSet.Core().RESTClient().Get())
-        if errProxy != nil {
-            framework.Logf("After %v failed to get services proxy request: %v", time.Since(start), errProxy)
-            continue
-        }
-
-        ctx, cancel := context.WithTimeout(context.Background(), framework.SingleCallTimeout)
-        defer cancel()
-
-        // Query against the root URL for Elasticsearch.
-        response := proxyRequest.Namespace(metav1.NamespaceSystem).
-            Context(ctx).
-            Name("elasticsearch-logging").
-            Do()
-        err = response.Error()
-        response.StatusCode(&statusCode)
-
-        if err != nil {
-            if ctx.Err() != nil {
-                framework.Failf("After %v proxy call to elasticsearch-logging failed: %v", time.Since(start), err)
-                continue
-            }
-            framework.Logf("After %v proxy call to elasticsearch-logging failed: %v", time.Since(start), err)
-            continue
-        }
-        if int(statusCode) != 200 {
-            framework.Logf("After %v Elasticsearch cluster has a bad status: %v", time.Since(start), statusCode)
-            continue
-        }
-        break
-    }
-    Expect(err).NotTo(HaveOccurred())
-    if int(statusCode) != 200 {
-        framework.Failf("Elasticsearch cluster has a bad status: %v", statusCode)
-    }
-
-    // Now assume we really are talking to an Elasticsearch instance.
-    // Check the cluster health.
-    By("Checking health of Elasticsearch service.")
-    healthy := false
-    for start := time.Now(); time.Since(start) < graceTime; time.Sleep(5 * time.Second) {
-        proxyRequest, errProxy := framework.GetServicesProxyRequest(f.ClientSet, f.ClientSet.Core().RESTClient().Get())
-        if errProxy != nil {
-            framework.Logf("After %v failed to get services proxy request: %v", time.Since(start), errProxy)
-            continue
-        }
-
-        ctx, cancel := context.WithTimeout(context.Background(), framework.SingleCallTimeout)
-        defer cancel()
-
-        body, err = proxyRequest.Namespace(metav1.NamespaceSystem).
-            Context(ctx).
-            Name("elasticsearch-logging").
-            Suffix("_cluster/health").
-            Param("level", "indices").
-            DoRaw()
-        if err != nil {
-            if ctx.Err() != nil {
-                framework.Failf("Failed to get cluster health from elasticsearch: %v", err)
-            }
-            continue
-        }
-        health := make(map[string]interface{})
-        err := json.Unmarshal(body, &health)
-        if err != nil {
-            framework.Logf("Bad json response from elasticsearch: %v", err)
-            continue
-        }
-        statusIntf, ok := health["status"]
-        if !ok {
-            framework.Logf("No status field found in cluster health response: %v", health)
-            continue
-        }
-        status := statusIntf.(string)
-        if status != "green" && status != "yellow" {
-            framework.Logf("Cluster health has bad status: %v", health)
-            continue
-        }
-        if err == nil && ok {
-            healthy = true
-            break
-        }
-    }
-    if !healthy {
-        return fmt.Errorf("After %v elasticsearch cluster is not healthy", graceTime)
-    }
-
-    return nil
-}

func getMissingLinesCountElasticsearch(f *framework.Framework, expectedCount int) (int, error) {
proxyRequest, errProxy := framework.GetServicesProxyRequest(f.ClientSet, f.ClientSet.Core().RESTClient().Get())
if errProxy != nil {
return 0, fmt.Errorf("Failed to get services proxy request: %v", errProxy)
}

ctx, cancel := context.WithTimeout(context.Background(), framework.SingleCallTimeout)
defer cancel()

// Ask Elasticsearch to return all the log lines that were tagged with the
// pod name. Ask for ten times as many log lines because duplication is possible.
body, err := proxyRequest.Namespace(metav1.NamespaceSystem).
Context(ctx).
Name("elasticsearch-logging").
Suffix("_search").
// TODO: Change filter to only match records from current test run
// after fluent-plugin-kubernetes_metadata_filter is enabled
// and optimize current query
Param("q", fmt.Sprintf("tag:*%s*", synthLoggerPodName)).
Param("size", strconv.Itoa(expectedCount*10)).
DoRaw()
if err != nil {
if ctx.Err() != nil {
framework.Failf("Failed to make proxy call to elasticsearch-logging: %v", err)
}
return 0, fmt.Errorf("Failed to make proxy call to elasticsearch-logging: %v", err)
}

var response map[string]interface{}
err = json.Unmarshal(body, &response)
if err != nil {
return 0, fmt.Errorf("Failed to unmarshal response: %v", err)
}

hits, ok := response["hits"].(map[string]interface{})
if !ok {
return 0, fmt.Errorf("response[hits] not of the expected type: %T", response["hits"])
}

h, ok := hits["hits"].([]interface{})
if !ok {
return 0, fmt.Errorf("Hits not of the expected type: %T", hits["hits"])
}

// Initialize data-structure for observing counts.
counts := make(map[int]int)

// Iterate over the hits and populate the observed array.
for _, e := range h {
l, ok := e.(map[string]interface{})
if !ok {
framework.Logf("Element of hit not of expected type: %T", e)
continue
}
source, ok := l["_source"].(map[string]interface{})
if !ok {
framework.Logf("_source not of the expected type: %T", l["_source"])
continue
}
msg, ok := source["log"].(string)
if !ok {
framework.Logf("Log not of the expected type: %T", source["log"])
continue
}
lineNumber, err := strconv.Atoi(strings.TrimSpace(msg))
if err != nil {
framework.Logf("Log line %s is not a number", msg)
continue
}
if lineNumber < 0 || lineNumber >= expectedCount {
framework.Logf("Number %d is not valid, expected number from range [0, %d)", lineNumber, expectedCount)
continue
}
// Record the observation of a log line
// Duplicates are possible and fine, fluentd has at-least-once delivery
counts[lineNumber]++
}

return expectedCount - len(counts), nil
}
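
For reference, the counting logic that the deleted getMissingLinesCountElasticsearch implemented (collect distinct synthetic line numbers, tolerate duplicates because fluentd delivers at-least-once) is what the shared waitForLogsIngestion helper generalizes across logs providers. That helper is defined in cluster_logging_utils.go and is not shown in this diff; the following is a minimal sketch of the assumed shape, with the logsProvider interface and the loggingPod fields invented here for illustration.

// Illustrative sketch only -- the real helper is not part of this diff.
package e2e

import (
    "fmt"
    "time"
)

type logsProvider interface {
    // FetchLogLines returns the synthetic line numbers already ingested
    // for the given pod (assumed method, duplicates allowed).
    FetchLogLines(pod *loggingPod) ([]int, error)
}

type loggingPod struct {
    Name          string
    ExpectedLines int
    observed      map[int]bool
}

// waitForLogsIngestion polls the provider until every pod is missing at
// most maxAllowedLostFraction of its lines, or the timeout expires.
func waitForLogsIngestion(p logsProvider, pods []*loggingPod, timeout time.Duration, maxAllowedLostFraction float64) error {
    for start := time.Now(); time.Since(start) < timeout; time.Sleep(30 * time.Second) {
        done := true
        for _, pod := range pods {
            if pod.observed == nil {
                pod.observed = make(map[int]bool)
            }
            lines, err := p.FetchLogLines(pod)
            if err != nil {
                return err
            }
            // Collapse duplicates: at-least-once delivery means the same
            // line number can be ingested more than once.
            for _, n := range lines {
                if n >= 0 && n < pod.ExpectedLines {
                    pod.observed[n] = true
                }
            }
            lost := pod.ExpectedLines - len(pod.observed)
            if float64(lost) > maxAllowedLostFraction*float64(pod.ExpectedLines) {
                done = false
            }
        }
        if done {
            return nil
        }
    }
    return fmt.Errorf("some log lines are still missing after %v", timeout)
}

With this shape, the call in the rewritten Elasticsearch test reads as: wait up to ten minutes for all 100 lines from the synthlogger pod to appear, allowing zero lost lines.
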