From 1638a0071dc67895cb86b37d79f55d2c200db31f Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Tue, 28 May 2024 08:32:37 +0300 Subject: [PATCH 01/30] Add logs-endpoint env-var injection --- controller/src/mutation/mutate.go | 14 ++++++++++++++ 1 file changed, 14 insertions(+) diff --git a/controller/src/mutation/mutate.go b/controller/src/mutation/mutate.go index ee68cc2..c32670c 100644 --- a/controller/src/mutation/mutate.go +++ b/controller/src/mutation/mutate.go @@ -46,6 +46,7 @@ const LumigoInjectorVolumeName = "lumigo-injector" const LumigoInjectorVolumeMountPoint = "/opt/lumigo" const LumigoTracerTokenEnvVarName = "LUMIGO_TRACER_TOKEN" const LumigoEndpointEnvVarName = "LUMIGO_ENDPOINT" +const LumigoLogsEndpointEnvVarName = "LUMIGO_LOGS_ENDPOINT" const LumigoContainerNameEnvVarName = "LUMIGO_CONTAINER_NAME" const LdPreloadEnvVarName = "LD_PRELOAD" const LdPreloadEnvVarValue = LumigoInjectorVolumeMountPoint + "/injector/lumigo_injector.so" @@ -78,6 +79,7 @@ type mutatorImpl struct { log *logr.Logger lumigoAutotraceLabelValue string lumigoEndpoint string + lumigoLogsEndpoint string lumigoToken *operatorv1alpha1.Credentials lumigoInjectorImage string } @@ -403,6 +405,18 @@ func (m *mutatorImpl) injectLumigoIntoPodSpec(podSpec *corev1.PodSpec) error { } else { envVars[lumigoEndpointEnvVarIndex] = *lumigoEndpointEnvVar } + + lumigoLogsEndpointEnvVar := &corev1.EnvVar{ + Name: LumigoLogsEndpointEnvVarName, + Value: m.lumigoLogsEndpoint, + } + lumigoLogsEndpointEnvVarIndex := slices.IndexFunc(envVars, func(c corev1.EnvVar) bool { return c.Name == LumigoLogsEndpointEnvVarName }) + if lumigoLogsEndpointEnvVarIndex < 0 { + envVars = append(envVars, *lumigoLogsEndpointEnvVar) + } else { + envVars[lumigoLogsEndpointEnvVarIndex] = *lumigoLogsEndpointEnvVar + } + lumigoContainerNameEnvVar := &corev1.EnvVar{ Name: LumigoContainerNameEnvVarName, Value: container.Name, From f296a8b172fc1a00f2929ec95bb75a745bba4810 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Tue, 28 May 2024 11:19:17 +0300 Subject: [PATCH 02/30] Update CONTRIBUTING guide --- CONTRIBUTING.md | 10 ++++++---- 1 file changed, 6 insertions(+), 4 deletions(-) diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index a54337b..d182878 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -30,6 +30,8 @@ Start `minikube`: minikube start --insecure-registry "host.docker.internal:5000" ``` +* Note that if the minikube machine already exists, you will need to delete it first with `minikube delete` - otherwise the `--insecure-registry` parameter will be ignored (more details [here](https://stackoverflow.com/a/53937716)) + Start a local Docker registry: ```sh @@ -46,7 +48,7 @@ $ curl localhost:5000/v2/_catalog -v > Host: localhost:5000 > User-Agent: curl/7.77.0 > Accept: */* -> +> * Mark bundle as not supporting multiuse < HTTP/1.1 200 OK < Content-Type: application/json; charset=utf-8 @@ -54,7 +56,7 @@ $ curl localhost:5000/v2/_catalog -v < X-Content-Type-Options: nosniff < Date: Fri, 20 Jan 2023 08:10:32 GMT < Content-Length: 20 -< +< {"repositories":[]} * Connection #0 to host localhost left intact ``` @@ -123,8 +125,8 @@ If you see the following, it's likely because and Mac OS has [squatted over port docker push host.docker.internal:5000/controller Using default tag: latest The push refers to repository [host.docker.internal:5000/controller] -377b701db379: Preparing -fba4381f2bb7: Preparing +377b701db379: Preparing +fba4381f2bb7: Preparing error parsing HTTP 403 response body: unexpected end of JSON input: "" ``` From 9c7b6ef8188d71487d2af142a2721e380cb271ce Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Tue, 28 May 2024 15:20:24 +0300 Subject: [PATCH 03/30] Propagate env-var, value is empty --- .../src/controllers/lumigo_controller.go | 5 +- controller/src/main.go | 18 +-- controller/src/mutation/mutate.go | 3 +- .../src/webhooks/injector/injector_webhook.go | 11 +- .../injector/injector_webhook_suite_test.go | 12 +- .../k8sdataenricherprocessor/processor.go | 117 +++++++++++++++++- 6 files changed, 144 insertions(+), 22 deletions(-) diff --git a/controller/src/controllers/lumigo_controller.go b/controller/src/controllers/lumigo_controller.go index 25f165f..ced1b06 100644 --- a/controller/src/controllers/lumigo_controller.go +++ b/controller/src/controllers/lumigo_controller.go @@ -77,6 +77,7 @@ type LumigoReconciler struct { LumigoOperatorVersion string LumigoInjectorImage string TelemetryProxyOtlpServiceUrl string + TelemetryProxyOtlpLogsServiceUrl string TelemetryProxyNamespaceConfigurationsPath string } @@ -489,7 +490,7 @@ func (r *LumigoReconciler) updateStatusIfNeeded(ctx context.Context, logger logr } func (r *LumigoReconciler) injectLumigoIntoResources(ctx context.Context, lumigo *operatorv1alpha1.Lumigo, log *logr.Logger) error { - mutator, err := mutation.NewMutator(log, &lumigo.Spec.LumigoToken, r.LumigoOperatorVersion, r.LumigoInjectorImage, r.TelemetryProxyOtlpServiceUrl) + mutator, err := mutation.NewMutator(log, &lumigo.Spec.LumigoToken, r.LumigoOperatorVersion, r.LumigoInjectorImage, r.TelemetryProxyOtlpServiceUrl, r.TelemetryProxyOtlpLogsServiceUrl) if err != nil { return fmt.Errorf("cannot instantiate mutator: %w", err) } @@ -688,7 +689,7 @@ func (r *LumigoReconciler) injectLumigoIntoResources(ctx context.Context, lumigo func (r *LumigoReconciler) removeLumigoFromResources(ctx context.Context, lumigo *operatorv1alpha1.Lumigo, log *logr.Logger) error { namespace := lumigo.Namespace - mutator, err := mutation.NewMutator(log, nil, r.LumigoOperatorVersion, r.LumigoInjectorImage, r.TelemetryProxyOtlpServiceUrl) + mutator, err := mutation.NewMutator(log, nil, r.LumigoOperatorVersion, r.LumigoInjectorImage, r.TelemetryProxyOtlpServiceUrl, r.TelemetryProxyOtlpLogsServiceUrl) if err != nil { return fmt.Errorf("cannot instantiate mutator: %w", err) } diff --git a/controller/src/main.go b/controller/src/main.go index b1521db..4c4f622 100644 --- a/controller/src/main.go +++ b/controller/src/main.go @@ -129,6 +129,7 @@ func startManager(metricsAddr string, probeAddr string, enableLeaderElection boo } telemetryProxyOtlpService := lumigoEndpoint + "/v1/traces" // TODO: Fix it when the distros use the Lumigo endpoint as root + telemetryProxyOtlpLogsService := lumigoEndpoint + "/v1/logs" namespaceConfigurationsPath, isSet := os.LookupEnv("LUMIGO_NAMESPACE_CONFIGURATIONS") if !isSet { @@ -151,14 +152,15 @@ func startManager(metricsAddr string, probeAddr string, enableLeaderElection boo } if err = (&controllers.LumigoReconciler{ - Client: mgr.GetClient(), - Clientset: clientset, - DynamicClient: dynamicClient, - EventRecorder: mgr.GetEventRecorderFor(fmt.Sprintf("lumigo-operator.v%s/controller", lumigoOperatorVersion)), - Scheme: mgr.GetScheme(), - LumigoOperatorVersion: lumigoOperatorVersion, - LumigoInjectorImage: lumigoInjectorImage, - TelemetryProxyOtlpServiceUrl: telemetryProxyOtlpService, + Client: mgr.GetClient(), + Clientset: clientset, + DynamicClient: dynamicClient, + EventRecorder: mgr.GetEventRecorderFor(fmt.Sprintf("lumigo-operator.v%s/controller", lumigoOperatorVersion)), + Scheme: mgr.GetScheme(), + LumigoOperatorVersion: lumigoOperatorVersion, + LumigoInjectorImage: lumigoInjectorImage, + TelemetryProxyOtlpServiceUrl: telemetryProxyOtlpService, + TelemetryProxyOtlpLogsServiceUrl: telemetryProxyOtlpLogsService, TelemetryProxyNamespaceConfigurationsPath: namespaceConfigurationsPath, Log: logger, }).SetupWithManager(mgr); err != nil { diff --git a/controller/src/mutation/mutate.go b/controller/src/mutation/mutate.go index c32670c..94065a9 100644 --- a/controller/src/mutation/mutate.go +++ b/controller/src/mutation/mutate.go @@ -88,7 +88,7 @@ func (m *mutatorImpl) GetAutotraceLabelValue() string { return m.lumigoAutotraceLabelValue } -func NewMutator(Log *logr.Logger, LumigoToken *operatorv1alpha1.Credentials, LumigoOperatorVersion string, LumigoInjectorImage string, TelemetryProxyOtlpServiceUrl string) (Mutator, error) { +func NewMutator(Log *logr.Logger, LumigoToken *operatorv1alpha1.Credentials, LumigoOperatorVersion string, LumigoInjectorImage string, TelemetryProxyOtlpServiceUrl string, TelemetryProxyOtlpLogsServiceUrl string) (Mutator, error) { version := LumigoOperatorVersion if len(version) > 8 { @@ -99,6 +99,7 @@ func NewMutator(Log *logr.Logger, LumigoToken *operatorv1alpha1.Credentials, Lum log: Log, lumigoAutotraceLabelValue: LumigoAutoTraceLabelVersionPrefixValue + version, lumigoEndpoint: TelemetryProxyOtlpServiceUrl, + lumigoLogsEndpoint: TelemetryProxyOtlpLogsServiceUrl, lumigoToken: LumigoToken, lumigoInjectorImage: LumigoInjectorImage, }, nil diff --git a/controller/src/webhooks/injector/injector_webhook.go b/controller/src/webhooks/injector/injector_webhook.go index 760f171..5a44767 100644 --- a/controller/src/webhooks/injector/injector_webhook.go +++ b/controller/src/webhooks/injector/injector_webhook.go @@ -50,10 +50,11 @@ type LumigoInjectorWebhookHandler struct { client.Client record.EventRecorder *admission.Decoder - LumigoOperatorVersion string - LumigoInjectorImage string - TelemetryProxyOtlpServiceUrl string - Log logr.Logger + LumigoOperatorVersion string + LumigoInjectorImage string + TelemetryProxyOtlpServiceUrl string + TelemetryProxyOtlpLogsServiceUrl string + Log logr.Logger } func (h *LumigoInjectorWebhookHandler) SetupWebhookWithManager(mgr ctrl.Manager) error { @@ -132,7 +133,7 @@ func (h *LumigoInjectorWebhookHandler) Handle(ctx context.Context, request admis return admission.Allowed(fmt.Sprintf("The Lumigo object in the '%s' namespace is not active; resource will not be mutated", namespace)) } - mutator, err := mutation.NewMutator(&log, &lumigo.Spec.LumigoToken, h.LumigoOperatorVersion, h.LumigoInjectorImage, h.TelemetryProxyOtlpServiceUrl) + mutator, err := mutation.NewMutator(&log, &lumigo.Spec.LumigoToken, h.LumigoOperatorVersion, h.LumigoInjectorImage, h.TelemetryProxyOtlpServiceUrl, h.TelemetryProxyOtlpLogsServiceUrl) if err != nil { return admission.Allowed(fmt.Errorf("cannot instantiate mutator: %w", err).Error()) } diff --git a/controller/src/webhooks/injector/injector_webhook_suite_test.go b/controller/src/webhooks/injector/injector_webhook_suite_test.go index bb872f2..ef0e977 100644 --- a/controller/src/webhooks/injector/injector_webhook_suite_test.go +++ b/controller/src/webhooks/injector/injector_webhook_suite_test.go @@ -64,6 +64,7 @@ var lumigoApiVersion = fmt.Sprintf("%s/%s", operatorv1alpha1.GroupVersion.Group, var lumigoOperatorVersion = "2b1e6b60ca871edee1d8f543c400f0b24663349144b78c79cfa006efaad6176a" // Unrealistically long, but we need to ensure we don't set label values too long var lumigoInjectorImage = "localhost:5000/lumigo-autotrace:test" var telemetryProxyOtlpServiceUrl = "lumigo-telemetry-proxy.lumigo-system.svc.cluster.local" +var telemetryProxyOtlpLogsServiceUrl = telemetryProxyOtlpServiceUrl var statusActive = operatorv1alpha1.LumigoStatus{ Conditions: []operatorv1alpha1.LumigoCondition{ @@ -174,11 +175,12 @@ var _ = BeforeSuite(func() { Expect(err).NotTo(HaveOccurred()) err = (&LumigoInjectorWebhookHandler{ - EventRecorder: mgr.GetEventRecorderFor(fmt.Sprintf("lumigo-operator.v%s", lumigoOperatorVersion)), - LumigoOperatorVersion: lumigoOperatorVersion, - LumigoInjectorImage: lumigoInjectorImage, - TelemetryProxyOtlpServiceUrl: telemetryProxyOtlpServiceUrl, - Log: ctrl.Log.WithName("injector-webhook").WithName("Lumigo"), + EventRecorder: mgr.GetEventRecorderFor(fmt.Sprintf("lumigo-operator.v%s", lumigoOperatorVersion)), + LumigoOperatorVersion: lumigoOperatorVersion, + LumigoInjectorImage: lumigoInjectorImage, + TelemetryProxyOtlpServiceUrl: telemetryProxyOtlpServiceUrl, + TelemetryProxyOtlpLogsServiceUrl: telemetryProxyOtlpLogsServiceUrl, + Log: ctrl.Log.WithName("injector-webhook").WithName("Lumigo"), }).SetupWebhookWithManager(mgr) Expect(err).NotTo(HaveOccurred()) diff --git a/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go b/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go index ac68c2f..41890b4 100644 --- a/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go +++ b/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go @@ -226,6 +226,7 @@ func (kp *kubernetesprocessor) processLogs(ctx context.Context, ld plog.Logs) (p func (kp *kubernetesprocessor) processResourceLogs(ctx context.Context, resourceLogs *plog.ResourceLogs) { scopeLogs := resourceLogs.ScopeLogs() + for i := 0; i < scopeLogs.Len(); i++ { sl := scopeLogs.At(i) @@ -244,7 +245,121 @@ func (kp *kubernetesprocessor) processResourceLogs(ctx context.Context, resource } default: { - kp.logger.Error("Unexpected logs scope", zap.String("scope-name", sl.Scope().Name())) + resource := resourceLogs.Resource() + resourceAttributes := resourceLogs.Resource().Attributes() + + resourceAttributes.PutStr(K8SProviderIdKey, kp.kube.GetProviderId()) + resourceAttributes.PutStr(K8SClusterUIDKey, string(kp.clusterUid)) + + pod, found := kp.getPod(ctx, &resource) + if !found { + kp.logger.Debug( + "Cannot find pod by 'k8s.pod.uid' of by connection ip", + zap.Any("resource-attributes", resourceAttributes.AsRaw()), + ) + continue + } + resourceAttributes.PutStr(K8SNodeNameKey, pod.Spec.NodeName) + + // Ensure 'k8s.pod.uid' is set (we might have found the pod via the network connection ip) + if _, found := resourceAttributes.Get(string(semconv.K8SPodUIDKey)); !found { + resourceAttributes.PutStr(string(semconv.K8SPodUIDKey), string(pod.UID)) + } + + resourceAttributes.PutStr(string(semconv.K8SPodNameKey), pod.Name) + + resourceAttributes.PutStr(string(semconv.K8SNamespaceNameKey), pod.Namespace) + if namespace, nsFound := kp.kube.GetNamespaceByName(pod.Namespace); nsFound { + resourceAttributes.PutStr("k8s.namespace.uid", string(namespace.UID)) + } else { + kp.logger.Error( + "Cannot add namespace resource attributes to traces, namespace not found", + zap.String("namespace", pod.Namespace), + ) + } + + ownerObject, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, pod) + if err != nil { + kp.logger.Error( + "Cannot look up owner reference for pod", + zap.Any("pod", pod), + zap.Error(err), + ) + } + + if !found { + kp.logger.Debug( + "Pod has no owner reference we can use to add other resource attributes", + zap.Any("pod", pod), + ) + continue + } + + switch podOwner := ownerObject.(type) { + case *appsv1.DaemonSet: + { + resourceAttributes.PutStr(string(semconv.K8SDaemonSetNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SDaemonSetUIDKey), string(podOwner.UID)) + } + case *appsv1.ReplicaSet: + { + resourceAttributes.PutStr(string(semconv.K8SReplicaSetNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SReplicaSetUIDKey), string(podOwner.UID)) + + if replicaSetOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { + if deployment, ok := replicaSetOwner.(*appsv1.Deployment); ok { + resourceAttributes.PutStr(string(semconv.K8SDeploymentNameKey), deployment.Name) + resourceAttributes.PutStr(string(semconv.K8SDeploymentUIDKey), string(deployment.UID)) + } else { + kp.logger.Error( + "Cannot add deployment resource attributes to traces, replicaset's owner object is not a *apps/v1.Deployment", + zap.Any("owner-object", ownerObject), + zap.Error(err), + ) + } + } else { + kp.logger.Debug( + "Cannot add deployment resource attributes to traces, replicaset has no deployment owner", + zap.Any("replicaset", podOwner), + zap.Error(err), + ) + } + } + case *appsv1.StatefulSet: + { + resourceAttributes.PutStr(string(semconv.K8SStatefulSetNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SStatefulSetUIDKey), string(podOwner.UID)) + } + case *batchv1.Job: + { + resourceAttributes.PutStr(string(semconv.K8SJobNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SJobUIDKey), string(podOwner.UID)) + + if jobOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { + if cronJob, ok := jobOwner.(*batchv1.CronJob); ok { + resourceAttributes.PutStr(string(semconv.K8SCronJobNameKey), cronJob.Name) + resourceAttributes.PutStr(string(semconv.K8SCronJobUIDKey), string(cronJob.UID)) + } else { + kp.logger.Error( + "Cannot add cronjob resource attributes to traces, job's object is not a *batch/v1.CronJob", + zap.Any("owner-object", ownerObject), + zap.Error(err), + ) + } + } else { + kp.logger.Debug( + "Cannot add cronjob resource attributes to traces, job has no cronjob owner", + zap.Any("job", podOwner), + zap.Error(err), + ) + } + } + default: + { + kp.logger.Error("Unexpected owner-object for pod", zap.Any("pod", pod), zap.Any("owner-object", ownerObject)) + } + } + return } } } From bc5be5e33151bc2d05a8253b7c81e4996d9b1003 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Tue, 28 May 2024 15:20:41 +0300 Subject: [PATCH 04/30] Fix docs --- CONTRIBUTING.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index d182878..a9fa625 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -102,7 +102,7 @@ Changing the target Lumigo backend can be done with a [`patchStrategicMerge`](ht echo -n "apiVersion: apps/v1 kind: Deployment metadata: - name: lumigo-controller-manager + name: lumigo-lumigo-controller-manager spec: template: spec: From a2f46fc58affe84c4326924b9b1785fed2e60acb Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Wed, 29 May 2024 12:06:58 +0300 Subject: [PATCH 05/30] Add pipeline --- config/manager/manager.yaml | 2 + helm.yaml | 2 + telemetryproxy/docker/etc/config.yaml.tpl | 15 + .../k8sdataenricherprocessor/processor.go | 316 ++++++------------ .../kind/internal/install_operator.go | 7 +- tests/kubernetes-distros/kind/main_test.go | 2 +- 6 files changed, 126 insertions(+), 218 deletions(-) diff --git a/config/manager/manager.yaml b/config/manager/manager.yaml index f7a6451..a578699 100644 --- a/config/manager/manager.yaml +++ b/config/manager/manager.yaml @@ -131,6 +131,8 @@ spec: value: Kustomize - name: LUMIGO_ENDPOINT value: https://ga-otlp.lumigo-tracer-edge.golumigo.com + - name: LUMIGO_LOGS_ENDPOINT + value: https://ga-otlp.lumigo-tracer-edge.golumigo.com ports: - containerPort: 4318 name: otlphttp diff --git a/helm.yaml b/helm.yaml index 227fc8b..d5dec7c 100644 --- a/helm.yaml +++ b/helm.yaml @@ -683,6 +683,8 @@ spec: readOnlyRootFilesystem: true runAsNonRoot: true - env: + - name: LUMIGO_LOGS_ENDPOINT + value: https://ga-otlp.lumigo-tracer-edge.golumigo.com - name: LUMIGO_ENDPOINT value: https://ga-otlp.lumigo-tracer-edge.golumigo.com - mountPath: /lumigo/etc/namespaces/ diff --git a/telemetryproxy/docker/etc/config.yaml.tpl b/telemetryproxy/docker/etc/config.yaml.tpl index 9e0f64e..6e52698 100644 --- a/telemetryproxy/docker/etc/config.yaml.tpl +++ b/telemetryproxy/docker/etc/config.yaml.tpl @@ -231,6 +231,21 @@ service: exporters: {{- if $config.debug }} - logging +{{- end }} + - otlphttp/lumigo_ns_{{ $namespace.name }} + logs/application_logs_ns_{{ $namespace.name }}: + receivers: + - otlp + processors: + - k8sdataenricherprocessor + - transform/add_ns_attributes_ns_{{ $namespace.name }} +{{- if $clusterName }} + - transform/add_cluster_name +{{- end }} + - transform/inject_operator_details_into_resource + exporters: +{{- if $config.debug }} + - logging {{- end }} - otlphttp/lumigo_ns_{{ $namespace.name }} logs/k8s_objects_ns_{{ $namespace.name }}: diff --git a/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go b/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go index 41890b4..9419ba8 100644 --- a/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go +++ b/telemetryproxy/src/processor/k8sdataenricherprocessor/processor.go @@ -72,122 +72,127 @@ func (kp *kubernetesprocessor) processTraces(ctx context.Context, tr ptrace.Trac resourceSpanLength := resourceSpans.Len() for i := 0; i < resourceSpanLength; i++ { resource := resourceSpans.At(i).Resource() - resourceAttributes := resource.Attributes() - resourceAttributes.PutStr(K8SProviderIdKey, kp.kube.GetProviderId()) - resourceAttributes.PutStr(K8SClusterUIDKey, string(kp.clusterUid)) + kp.addResourceAttributes(ctx, resource) + } - pod, found := kp.getPod(ctx, &resource) - if !found { - kp.logger.Debug( - "Cannot find pod by 'k8s.pod.uid' of by connection ip", - zap.Any("resource-attributes", resourceAttributes.AsRaw()), - ) - continue - } - resourceAttributes.PutStr(K8SNodeNameKey, pod.Spec.NodeName) + return tr, nil +} - // Ensure 'k8s.pod.uid' is set (we might have found the pod via the network connection ip) - if _, found := resourceAttributes.Get(string(semconv.K8SPodUIDKey)); !found { - resourceAttributes.PutStr(string(semconv.K8SPodUIDKey), string(pod.UID)) - } +func (kp *kubernetesprocessor) addResourceAttributes(ctx context.Context, resource pcommon.Resource) { + resourceAttributes := resource.Attributes() - resourceAttributes.PutStr(string(semconv.K8SPodNameKey), pod.Name) + resourceAttributes.PutStr(K8SProviderIdKey, kp.kube.GetProviderId()) + resourceAttributes.PutStr(K8SClusterUIDKey, string(kp.clusterUid)) - resourceAttributes.PutStr(string(semconv.K8SNamespaceNameKey), pod.Namespace) - if namespace, nsFound := kp.kube.GetNamespaceByName(pod.Namespace); nsFound { - resourceAttributes.PutStr("k8s.namespace.uid", string(namespace.UID)) - } else { - kp.logger.Error( - "Cannot add namespace resource attributes to traces, namespace not found", - zap.String("namespace", pod.Namespace), - ) - } + pod, found := kp.getPod(ctx, &resource) + if !found { + kp.logger.Debug( + "Cannot find pod by 'k8s.pod.uid' of by connection ip", + zap.Any("resource-attributes", resourceAttributes.AsRaw()), + ) + return + } + resourceAttributes.PutStr(K8SNodeNameKey, pod.Spec.NodeName) - ownerObject, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, pod) - if err != nil { - kp.logger.Error( - "Cannot look up owner reference for pod", - zap.Any("pod", pod), - zap.Error(err), - ) - } + // Ensure 'k8s.pod.uid' is set (we might have found the pod via the network connection ip) + if _, found := resourceAttributes.Get(string(semconv.K8SPodUIDKey)); !found { + resourceAttributes.PutStr(string(semconv.K8SPodUIDKey), string(pod.UID)) + } - if !found { - kp.logger.Debug( - "Pod has no owner reference we can use to add other resource attributes", - zap.Any("pod", pod), - ) - continue + resourceAttributes.PutStr(string(semconv.K8SPodNameKey), pod.Name) + + resourceAttributes.PutStr(string(semconv.K8SNamespaceNameKey), pod.Namespace) + if namespace, nsFound := kp.kube.GetNamespaceByName(pod.Namespace); nsFound { + resourceAttributes.PutStr("k8s.namespace.uid", string(namespace.UID)) + } else { + kp.logger.Error( + "Cannot add namespace resource attributes to traces, namespace not found", + zap.String("namespace", pod.Namespace), + ) + } + + ownerObject, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, pod) + if err != nil { + kp.logger.Error( + "Cannot look up owner reference for pod", + zap.Any("pod", pod), + zap.Error(err), + ) + } + + if !found { + kp.logger.Debug( + "Pod has no owner reference we can use to add other resource attributes", + zap.Any("pod", pod), + ) + return + } + + switch podOwner := ownerObject.(type) { + case *appsv1.DaemonSet: + { + resourceAttributes.PutStr(string(semconv.K8SDaemonSetNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SDaemonSetUIDKey), string(podOwner.UID)) } + case *appsv1.ReplicaSet: + { + resourceAttributes.PutStr(string(semconv.K8SReplicaSetNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SReplicaSetUIDKey), string(podOwner.UID)) - switch podOwner := ownerObject.(type) { - case *appsv1.DaemonSet: - { - resourceAttributes.PutStr(string(semconv.K8SDaemonSetNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SDaemonSetUIDKey), string(podOwner.UID)) - } - case *appsv1.ReplicaSet: - { - resourceAttributes.PutStr(string(semconv.K8SReplicaSetNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SReplicaSetUIDKey), string(podOwner.UID)) - - if replicaSetOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { - if deployment, ok := replicaSetOwner.(*appsv1.Deployment); ok { - resourceAttributes.PutStr(string(semconv.K8SDeploymentNameKey), deployment.Name) - resourceAttributes.PutStr(string(semconv.K8SDeploymentUIDKey), string(deployment.UID)) - } else { - kp.logger.Error( - "Cannot add deployment resource attributes to traces, replicaset's owner object is not a *apps/v1.Deployment", - zap.Any("owner-object", ownerObject), - zap.Error(err), - ) - } + if replicaSetOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { + if deployment, ok := replicaSetOwner.(*appsv1.Deployment); ok { + resourceAttributes.PutStr(string(semconv.K8SDeploymentNameKey), deployment.Name) + resourceAttributes.PutStr(string(semconv.K8SDeploymentUIDKey), string(deployment.UID)) } else { - kp.logger.Debug( - "Cannot add deployment resource attributes to traces, replicaset has no deployment owner", - zap.Any("replicaset", podOwner), + kp.logger.Error( + "Cannot add deployment resource attributes to traces, replicaset's owner object is not a *apps/v1.Deployment", + zap.Any("owner-object", ownerObject), zap.Error(err), ) } + } else { + kp.logger.Debug( + "Cannot add deployment resource attributes to traces, replicaset has no deployment owner", + zap.Any("replicaset", podOwner), + zap.Error(err), + ) } - case *appsv1.StatefulSet: - { - resourceAttributes.PutStr(string(semconv.K8SStatefulSetNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SStatefulSetUIDKey), string(podOwner.UID)) - } - case *batchv1.Job: - { - resourceAttributes.PutStr(string(semconv.K8SJobNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SJobUIDKey), string(podOwner.UID)) - - if jobOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { - if cronJob, ok := jobOwner.(*batchv1.CronJob); ok { - resourceAttributes.PutStr(string(semconv.K8SCronJobNameKey), cronJob.Name) - resourceAttributes.PutStr(string(semconv.K8SCronJobUIDKey), string(cronJob.UID)) - } else { - kp.logger.Error( - "Cannot add cronjob resource attributes to traces, job's object is not a *batch/v1.CronJob", - zap.Any("owner-object", ownerObject), - zap.Error(err), - ) - } + } + case *appsv1.StatefulSet: + { + resourceAttributes.PutStr(string(semconv.K8SStatefulSetNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SStatefulSetUIDKey), string(podOwner.UID)) + } + case *batchv1.Job: + { + resourceAttributes.PutStr(string(semconv.K8SJobNameKey), podOwner.Name) + resourceAttributes.PutStr(string(semconv.K8SJobUIDKey), string(podOwner.UID)) + + if jobOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { + if cronJob, ok := jobOwner.(*batchv1.CronJob); ok { + resourceAttributes.PutStr(string(semconv.K8SCronJobNameKey), cronJob.Name) + resourceAttributes.PutStr(string(semconv.K8SCronJobUIDKey), string(cronJob.UID)) } else { - kp.logger.Debug( - "Cannot add cronjob resource attributes to traces, job has no cronjob owner", - zap.Any("job", podOwner), + kp.logger.Error( + "Cannot add cronjob resource attributes to traces, job's object is not a *batch/v1.CronJob", + zap.Any("owner-object", ownerObject), zap.Error(err), ) } + } else { + kp.logger.Debug( + "Cannot add cronjob resource attributes to traces, job has no cronjob owner", + zap.Any("job", podOwner), + zap.Error(err), + ) } - default: - { - kp.logger.Error("Unexpected owner-object for pod", zap.Any("pod", pod), zap.Any("owner-object", ownerObject)) - } + } + default: + { + kp.logger.Error("Unexpected owner-object for pod", zap.Any("pod", pod), zap.Any("owner-object", ownerObject)) } } - - return tr, nil } func (kp *kubernetesprocessor) getPod(ctx context.Context, resource *pcommon.Resource) (*corev1.Pod, bool) { @@ -214,10 +219,7 @@ func (kp *kubernetesprocessor) processLogs(ctx context.Context, ld plog.Logs) (p for i := 0; i < resourceLogs.Len(); i++ { rl := resourceLogs.At(i) - resourceAttributes := rl.Resource().Attributes() - resourceAttributes.PutStr(K8SClusterUIDKey, string(kp.clusterUid)) - resourceAttributes.PutStr(K8SProviderIdKey, kp.kube.GetProviderId()) - + kp.addResourceAttributes(ctx, rl.Resource()); kp.processResourceLogs(ctx, &rl) } @@ -245,121 +247,7 @@ func (kp *kubernetesprocessor) processResourceLogs(ctx context.Context, resource } default: { - resource := resourceLogs.Resource() - resourceAttributes := resourceLogs.Resource().Attributes() - - resourceAttributes.PutStr(K8SProviderIdKey, kp.kube.GetProviderId()) - resourceAttributes.PutStr(K8SClusterUIDKey, string(kp.clusterUid)) - - pod, found := kp.getPod(ctx, &resource) - if !found { - kp.logger.Debug( - "Cannot find pod by 'k8s.pod.uid' of by connection ip", - zap.Any("resource-attributes", resourceAttributes.AsRaw()), - ) - continue - } - resourceAttributes.PutStr(K8SNodeNameKey, pod.Spec.NodeName) - - // Ensure 'k8s.pod.uid' is set (we might have found the pod via the network connection ip) - if _, found := resourceAttributes.Get(string(semconv.K8SPodUIDKey)); !found { - resourceAttributes.PutStr(string(semconv.K8SPodUIDKey), string(pod.UID)) - } - - resourceAttributes.PutStr(string(semconv.K8SPodNameKey), pod.Name) - - resourceAttributes.PutStr(string(semconv.K8SNamespaceNameKey), pod.Namespace) - if namespace, nsFound := kp.kube.GetNamespaceByName(pod.Namespace); nsFound { - resourceAttributes.PutStr("k8s.namespace.uid", string(namespace.UID)) - } else { - kp.logger.Error( - "Cannot add namespace resource attributes to traces, namespace not found", - zap.String("namespace", pod.Namespace), - ) - } - - ownerObject, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, pod) - if err != nil { - kp.logger.Error( - "Cannot look up owner reference for pod", - zap.Any("pod", pod), - zap.Error(err), - ) - } - - if !found { - kp.logger.Debug( - "Pod has no owner reference we can use to add other resource attributes", - zap.Any("pod", pod), - ) - continue - } - - switch podOwner := ownerObject.(type) { - case *appsv1.DaemonSet: - { - resourceAttributes.PutStr(string(semconv.K8SDaemonSetNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SDaemonSetUIDKey), string(podOwner.UID)) - } - case *appsv1.ReplicaSet: - { - resourceAttributes.PutStr(string(semconv.K8SReplicaSetNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SReplicaSetUIDKey), string(podOwner.UID)) - - if replicaSetOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { - if deployment, ok := replicaSetOwner.(*appsv1.Deployment); ok { - resourceAttributes.PutStr(string(semconv.K8SDeploymentNameKey), deployment.Name) - resourceAttributes.PutStr(string(semconv.K8SDeploymentUIDKey), string(deployment.UID)) - } else { - kp.logger.Error( - "Cannot add deployment resource attributes to traces, replicaset's owner object is not a *apps/v1.Deployment", - zap.Any("owner-object", ownerObject), - zap.Error(err), - ) - } - } else { - kp.logger.Debug( - "Cannot add deployment resource attributes to traces, replicaset has no deployment owner", - zap.Any("replicaset", podOwner), - zap.Error(err), - ) - } - } - case *appsv1.StatefulSet: - { - resourceAttributes.PutStr(string(semconv.K8SStatefulSetNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SStatefulSetUIDKey), string(podOwner.UID)) - } - case *batchv1.Job: - { - resourceAttributes.PutStr(string(semconv.K8SJobNameKey), podOwner.Name) - resourceAttributes.PutStr(string(semconv.K8SJobUIDKey), string(podOwner.UID)) - - if jobOwner, found, err := kp.kube.ResolveRelevantOwnerReference(ctx, podOwner); found { - if cronJob, ok := jobOwner.(*batchv1.CronJob); ok { - resourceAttributes.PutStr(string(semconv.K8SCronJobNameKey), cronJob.Name) - resourceAttributes.PutStr(string(semconv.K8SCronJobUIDKey), string(cronJob.UID)) - } else { - kp.logger.Error( - "Cannot add cronjob resource attributes to traces, job's object is not a *batch/v1.CronJob", - zap.Any("owner-object", ownerObject), - zap.Error(err), - ) - } - } else { - kp.logger.Debug( - "Cannot add cronjob resource attributes to traces, job has no cronjob owner", - zap.Any("job", podOwner), - zap.Error(err), - ) - } - } - default: - { - kp.logger.Error("Unexpected owner-object for pod", zap.Any("pod", pod), zap.Any("owner-object", ownerObject)) - } - } - return + kp.logger.Error("Unexpected logs scope", zap.String("scope-name", sl.Scope().Name())) } } } diff --git a/tests/kubernetes-distros/kind/internal/install_operator.go b/tests/kubernetes-distros/kind/internal/install_operator.go index cf494ab..0df16a9 100644 --- a/tests/kubernetes-distros/kind/internal/install_operator.go +++ b/tests/kubernetes-distros/kind/internal/install_operator.go @@ -28,7 +28,7 @@ const ( DEFAULT_IMG_VERSION = "latest" ) -func installLumigoOperator(ctx context.Context, client klient.Client, kubeconfigFilePath string, lumigoNamespace string, otlpSinkUrl string, logger logr.Logger) (context.Context, error) { +func installLumigoOperator(ctx context.Context, client klient.Client, kubeconfigFilePath string, lumigoNamespace string, otlpSinkUrl string, otlpSinkLogsUrl string, logger logr.Logger) (context.Context, error) { controllerImageName, controllerImageTag := splitContainerImageNameAndTag(ctx.Value(ContextKeyOperatorControllerImage).(string)) telemetryProxyImageName, telemetryProxyImageTag := splitContainerImageNameAndTag(ctx.Value(ContextKeyOperatorTelemetryProxyImage).(string)) operatorDebug := ctx.Value(ContextKeyLumigoOperatorDebug).(bool) @@ -50,6 +50,7 @@ func installLumigoOperator(ctx context.Context, client klient.Client, kubeconfig helm.WithArgs(fmt.Sprintf("--set controllerManager.telemetryProxy.image.repository=%s", telemetryProxyImageName)), helm.WithArgs(fmt.Sprintf("--set controllerManager.telemetryProxy.image.tag=%s", telemetryProxyImageTag)), helm.WithArgs(fmt.Sprintf("--set endpoint.otlp.url=%s", otlpSinkUrl)), + helm.WithArgs(fmt.Sprintf("--set endpoint.otlp.logs.url=%s", otlpSinkUrl)), helm.WithArgs(fmt.Sprintf("--set debug.enabled=%v", operatorDebug)), // Operator debug logging at runtime helm.WithArgs("--debug"), // Helm debug output on install helm.WithWait(), @@ -70,14 +71,14 @@ func installLumigoOperator(ctx context.Context, client klient.Client, kubeconfig return ctx, nil } -func LumigoOperatorEnvFunc(lumigoNamespace string, otlpSinkUrl string, logger logr.Logger) func(ctx context.Context, cfg *envconf.Config) (context.Context, error) { +func LumigoOperatorEnvFunc(lumigoNamespace string, otlpSinkUrl string, otlpSinkLogsUrl string, logger logr.Logger) func(ctx context.Context, cfg *envconf.Config) (context.Context, error) { return func(ctx context.Context, config *envconf.Config) (context.Context, error) { client, err := config.NewClient() if err != nil { return ctx, err } - return installLumigoOperator(ctx, client, config.KubeconfigFile(), lumigoNamespace, otlpSinkUrl, logger) + return installLumigoOperator(ctx, client, config.KubeconfigFile(), lumigoNamespace, otlpSinkUrl, otlpSinkLogsUrl, logger) } } diff --git a/tests/kubernetes-distros/kind/main_test.go b/tests/kubernetes-distros/kind/main_test.go index 639af0e..f3eef20 100644 --- a/tests/kubernetes-distros/kind/main_test.go +++ b/tests/kubernetes-distros/kind/main_test.go @@ -208,7 +208,7 @@ func TestMain(m *testing.M) { logrWrapper := stdr.New(logger) otlpSinkFeature, otlpSinkK8sServiceUrl := internal.OtlpSinkEnvFunc(OTLP_SINK_NAMESPACE, "otlp-sink", OTLP_SINK_OTEL_COLLECTOR_IMAGE, logrWrapper) - lumigoOperatorFeature := internal.LumigoOperatorEnvFunc(LUMIGO_SYSTEM_NAMESPACE, otlpSinkK8sServiceUrl, logrWrapper) + lumigoOperatorFeature := internal.LumigoOperatorEnvFunc(LUMIGO_SYSTEM_NAMESPACE, otlpSinkK8sServiceUrl, otlpSinkK8sServiceUrl, logrWrapper) testEnv.Setup( internal.BuildDockerImageAndExportArchive(controllerImageName, filepath.Join(repoRoot, "controller"), controllerImageArchivePath, logger), From 381ca48463ef2c80829b317b9ce088a8c82b15d1 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Wed, 29 May 2024 13:35:33 +0300 Subject: [PATCH 06/30] Fixes --- CONTRIBUTING.md | 2 ++ .../templates/controller-deployment-and-webhooks.yaml | 2 ++ charts/lumigo-operator/values.yaml | 3 ++- controller/src/main.go | 11 ++++++----- .../kind/internal/install_operator.go | 2 +- 5 files changed, 13 insertions(+), 7 deletions(-) diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index a9fa625..50a967f 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -111,6 +111,8 @@ spec: env: - name: LUMIGO_ENDPOINT value: \"https://my.lumigo.endpoint\" # Replace this! + - name: LUMIGO_LOGS_ENDPOINT + value: \"https://my.lumigo.endpoint\" # Replace this! " > lumigo-endpoint.patch.yaml kubectl patch --patch-file lumigo-endpoint.patch.yaml --type strategic -n lumigo-system --filename=lumigo-endpoint.patch.yaml ``` diff --git a/charts/lumigo-operator/templates/controller-deployment-and-webhooks.yaml b/charts/lumigo-operator/templates/controller-deployment-and-webhooks.yaml index c43230e..31544eb 100644 --- a/charts/lumigo-operator/templates/controller-deployment-and-webhooks.yaml +++ b/charts/lumigo-operator/templates/controller-deployment-and-webhooks.yaml @@ -231,6 +231,8 @@ spec: value: "{{ .Values.debug.enabled | default false }}" - name: LUMIGO_ENDPOINT value: "{{ .Values.endpoint.otlp.url }}" + - name: LUMIGO_LOGS_ENDPOINT + value: "{{ .Values.endpoint.otlp.logs_url }}" - name: LUMIGO_OPERATOR_VERSION value: "{{ $lumigoOperatorVersion }}" - name: LUMIGO_OPERATOR_DEPLOYMENT_METHOD diff --git a/charts/lumigo-operator/values.yaml b/charts/lumigo-operator/values.yaml index f1652c7..e7d8bd3 100644 --- a/charts/lumigo-operator/values.yaml +++ b/charts/lumigo-operator/values.yaml @@ -61,4 +61,5 @@ metricsService: type: ClusterIP endpoint: otlp: - url: https://ga-otlp.lumigo-tracer-edge.golumigo.com \ No newline at end of file + url: https://ga-otlp.lumigo-tracer-edge.golumigo.com + logs_url: https://ga-otlp.lumigo-tracer-edge.golumigo.com \ No newline at end of file diff --git a/controller/src/main.go b/controller/src/main.go index 4c4f622..5923b43 100644 --- a/controller/src/main.go +++ b/controller/src/main.go @@ -168,11 +168,12 @@ func startManager(metricsAddr string, probeAddr string, enableLeaderElection boo } if err = (&injector.LumigoInjectorWebhookHandler{ - EventRecorder: mgr.GetEventRecorderFor(fmt.Sprintf("lumigo-operator.v%s/injector-webhook", lumigoOperatorVersion)), - LumigoOperatorVersion: lumigoOperatorVersion, - LumigoInjectorImage: lumigoInjectorImage, - TelemetryProxyOtlpServiceUrl: telemetryProxyOtlpService, - Log: logger, + EventRecorder: mgr.GetEventRecorderFor(fmt.Sprintf("lumigo-operator.v%s/injector-webhook", lumigoOperatorVersion)), + LumigoOperatorVersion: lumigoOperatorVersion, + LumigoInjectorImage: lumigoInjectorImage, + TelemetryProxyOtlpServiceUrl: telemetryProxyOtlpService, + TelemetryProxyOtlpLogsServiceUrl: telemetryProxyOtlpLogsService, + Log: logger, }).SetupWebhookWithManager(mgr); err != nil { return fmt.Errorf("unable to create injector webhook: %w", err) } diff --git a/tests/kubernetes-distros/kind/internal/install_operator.go b/tests/kubernetes-distros/kind/internal/install_operator.go index 0df16a9..a202e52 100644 --- a/tests/kubernetes-distros/kind/internal/install_operator.go +++ b/tests/kubernetes-distros/kind/internal/install_operator.go @@ -50,7 +50,7 @@ func installLumigoOperator(ctx context.Context, client klient.Client, kubeconfig helm.WithArgs(fmt.Sprintf("--set controllerManager.telemetryProxy.image.repository=%s", telemetryProxyImageName)), helm.WithArgs(fmt.Sprintf("--set controllerManager.telemetryProxy.image.tag=%s", telemetryProxyImageTag)), helm.WithArgs(fmt.Sprintf("--set endpoint.otlp.url=%s", otlpSinkUrl)), - helm.WithArgs(fmt.Sprintf("--set endpoint.otlp.logs.url=%s", otlpSinkUrl)), + helm.WithArgs(fmt.Sprintf("--set endpoint.otlp.logs_url=%s", otlpSinkUrl)), helm.WithArgs(fmt.Sprintf("--set debug.enabled=%v", operatorDebug)), // Operator debug logging at runtime helm.WithArgs("--debug"), // Helm debug output on install helm.WithWait(), From 0daab4f53068ec670afa6d591e4f25d6c761a05e Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Wed, 29 May 2024 14:48:06 +0300 Subject: [PATCH 07/30] Change logs exporter --- telemetryproxy/docker/etc/config.yaml.tpl | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/telemetryproxy/docker/etc/config.yaml.tpl b/telemetryproxy/docker/etc/config.yaml.tpl index 6e52698..6b61311 100644 --- a/telemetryproxy/docker/etc/config.yaml.tpl +++ b/telemetryproxy/docker/etc/config.yaml.tpl @@ -98,6 +98,16 @@ exporters: verbosity: detailed sampling_initial: 1 sampling_thereafter: 1 +{{- end }} + otlphttp/lumigo_logs: + endpoint: {{ env.Getenv "LUMIGO_LOGS_ENDPOINT" "https://ga-otlp.lumigo-tracer-edge.golumigo.com" }} + auth: + authenticator: headers_setter/lumigo +{{- if $debug }} + logging: + verbosity: detailed + sampling_initial: 1 + sampling_thereafter: 1 {{- end }} {{- range $i, $namespace := $namespaces }} otlphttp/lumigo_ns_{{ $namespace.name }}: @@ -247,7 +257,7 @@ service: {{- if $config.debug }} - logging {{- end }} - - otlphttp/lumigo_ns_{{ $namespace.name }} + - otlphttp/lumigo_logs logs/k8s_objects_ns_{{ $namespace.name }}: receivers: - k8sobjects/objects_ns_{{ $namespace.name }} From a3f801ea9d94b88c0a2be3bcec773ff8e8686145 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Wed, 29 May 2024 16:20:13 +0300 Subject: [PATCH 08/30] Remove duplicate logging section --- telemetryproxy/docker/etc/config.yaml.tpl | 6 ------ 1 file changed, 6 deletions(-) diff --git a/telemetryproxy/docker/etc/config.yaml.tpl b/telemetryproxy/docker/etc/config.yaml.tpl index 6b61311..73b6a19 100644 --- a/telemetryproxy/docker/etc/config.yaml.tpl +++ b/telemetryproxy/docker/etc/config.yaml.tpl @@ -93,12 +93,6 @@ exporters: endpoint: {{ env.Getenv "LUMIGO_ENDPOINT" "https://ga-otlp.lumigo-tracer-edge.golumigo.com" }} auth: authenticator: headers_setter/lumigo -{{- if $debug }} - logging: - verbosity: detailed - sampling_initial: 1 - sampling_thereafter: 1 -{{- end }} otlphttp/lumigo_logs: endpoint: {{ env.Getenv "LUMIGO_LOGS_ENDPOINT" "https://ga-otlp.lumigo-tracer-edge.golumigo.com" }} auth: From 7629fcf9113a804ecda965363b1c756141351956 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Wed, 29 May 2024 16:27:50 +0300 Subject: [PATCH 09/30] Remove unused test function --- .../kind/internal/install_operator.go | 18 ------------------ 1 file changed, 18 deletions(-) diff --git a/tests/kubernetes-distros/kind/internal/install_operator.go b/tests/kubernetes-distros/kind/internal/install_operator.go index a202e52..5474354 100644 --- a/tests/kubernetes-distros/kind/internal/install_operator.go +++ b/tests/kubernetes-distros/kind/internal/install_operator.go @@ -6,7 +6,6 @@ import ( "os" "path/filepath" "strings" - "testing" "time" "github.com/go-logr/logr" @@ -14,7 +13,6 @@ import ( "sigs.k8s.io/e2e-framework/klient/wait" "sigs.k8s.io/e2e-framework/klient/wait/conditions" "sigs.k8s.io/e2e-framework/pkg/envconf" - "sigs.k8s.io/e2e-framework/pkg/features" "sigs.k8s.io/e2e-framework/third_party/helm" appsv1 "k8s.io/api/apps/v1" @@ -82,22 +80,6 @@ func LumigoOperatorEnvFunc(lumigoNamespace string, otlpSinkUrl string, otlpSinkL } } -func LumigoOperatorFeature(lumigoNamespace string, otlpSinkUrl string, logger logr.Logger) features.Feature { - return features.New("LumigoOperatorLocal").Setup(func(ctx context.Context, t *testing.T, config *envconf.Config) context.Context { - client, err := config.NewClient() - if err != nil { - t.Fatal(err) - } - - ctx, err = installLumigoOperator(ctx, client, config.KubeconfigFile(), lumigoNamespace, otlpSinkUrl, logger) - if err != nil { - t.Fatal(err) - } - - return ctx - }).Feature() -} - func splitContainerImageNameAndTag(imageName string) (string, string) { lastColonIndex := strings.LastIndex(imageName, ":") lastSlashIndex := strings.LastIndex(imageName, "/") From 4a8cdedeefa8040d38df76e21a075d40c6b6582b Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 2 Jun 2024 10:46:13 +0300 Subject: [PATCH 10/30] Produce test-app logs using Winston --- tests/kubernetes-distros/kind/apps/client/app.js | 11 ++++++++--- .../kubernetes-distros/kind/apps/client/package.json | 6 ++++-- 2 files changed, 12 insertions(+), 5 deletions(-) diff --git a/tests/kubernetes-distros/kind/apps/client/app.js b/tests/kubernetes-distros/kind/apps/client/app.js index 9125008..1cd46e5 100644 --- a/tests/kubernetes-distros/kind/apps/client/app.js +++ b/tests/kubernetes-distros/kind/apps/client/app.js @@ -2,16 +2,21 @@ const axios = require('axios'); const { init } = require('@lumigo/opentelemetry'); const { SpanStatusCode, trace } = require('@opentelemetry/api'); +const winston = require('winston'); if (!process.env.TARGET_URL) { throw new Error("The required environment variable 'TARGET_URL' is not set") } -(async() => { +(async () => { const { tracerProvider } = await init; const tracer = trace.getTracer(__filename) - - await tracer.startActiveSpan('batch', async(rootSpan) => { + const logger = winston.createLogger({ + transports: [new winston.transports.Console()], + level: 'info' + }); + logger.info('Starting batch job...'); + await tracer.startActiveSpan('batch', async (rootSpan) => { try { const res = await axios.post(`${process.env.TARGET_URL}/api/checkout`, { "reference": "Order1234567", diff --git a/tests/kubernetes-distros/kind/apps/client/package.json b/tests/kubernetes-distros/kind/apps/client/package.json index 9def253..bdfb890 100644 --- a/tests/kubernetes-distros/kind/apps/client/package.json +++ b/tests/kubernetes-distros/kind/apps/client/package.json @@ -4,9 +4,11 @@ "license": "ISC", "dependencies": { "@opentelemetry/api": "^1.4.1", - "axios": "^1.1.2" + "axios": "^1.1.2", + "winston": "3.13.0", + "@opentelemetry/winston-transport": "0.3.0" }, "scripts": { "start": "node app.js" } -} +} \ No newline at end of file From bba6e6037fd07c1c64264d6f1898c3a746c70127 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 2 Jun 2024 13:15:09 +0300 Subject: [PATCH 11/30] Try activate UT --- Makefile | 2 +- controller/src/controllers/lumigo_controller_suite_test.go | 2 +- .../src/webhooks/defaulter/defaulter_webhook_suite_test.go | 6 +++--- .../src/webhooks/injector/injector_webhook_suite_test.go | 2 +- 4 files changed, 6 insertions(+), 6 deletions(-) diff --git a/Makefile b/Makefile index 1d77c76..806afb0 100644 --- a/Makefile +++ b/Makefile @@ -73,7 +73,7 @@ vet: ## Run go vet against code. .PHONY: test test: manifests generate fmt vet envtest ## Run tests. - (cd ./controller/src && KUBEBUILDER_ASSETS="$(shell $(ENVTEST) use $(ENVTEST_K8S_VERSION) --bin-dir $(LOCALBIN) -p path)" $(GOCMD) test . -coverprofile cover.out ) + (cd ./controller/src && KUBEBUILDER_ASSETS="$(shell $(ENVTEST) use $(ENVTEST_K8S_VERSION) --bin-dir $(LOCALBIN) -p path)" $(GOCMD) test ./... -failfast -coverprofile cover.out ) ##@ Build diff --git a/controller/src/controllers/lumigo_controller_suite_test.go b/controller/src/controllers/lumigo_controller_suite_test.go index 32d7b2b..4a995f9 100644 --- a/controller/src/controllers/lumigo_controller_suite_test.go +++ b/controller/src/controllers/lumigo_controller_suite_test.go @@ -81,7 +81,7 @@ var _ = BeforeSuite(func() { By("bootstrapping test environment") testEnv = &envtest.Environment{ - CRDDirectoryPaths: []string{filepath.Join("..", "config", "crd", "bases")}, + CRDDirectoryPaths: []string{filepath.Join("..", "..", "..", "config", "crd", "bases")}, ErrorIfCRDPathMissing: true, } diff --git a/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go b/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go index 5af3635..28c8782 100644 --- a/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go +++ b/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go @@ -71,10 +71,10 @@ var _ = BeforeSuite(func() { By("bootstrapping test environment") testEnv = &envtest.Environment{ - CRDDirectoryPaths: []string{filepath.Join("..", "..", "config", "crd", "bases")}, + CRDDirectoryPaths: []string{filepath.Join("..", "..", "..", "..", "..", "config", "crd", "bases")}, ErrorIfCRDPathMissing: false, WebhookInstallOptions: envtest.WebhookInstallOptions{ - Paths: []string{filepath.Join("..", "..", "config", "webhooks")}, + Paths: []string{filepath.Join("..", "..", "..", "..", "config", "webhooks")}, }, } @@ -218,7 +218,7 @@ var _ = Context("Lumigo defaulter webhook", func() { }, } - Expect(k8sClient.Create(ctx, &newLumigo)).To(Succeed()) + Expect(k8sClient.Create(ctx, &newLumigo)).To(MatchError("abc")) Expect(newLumigo.Spec.Infrastructure.Enabled).To(&beBoolPointer{expectedValue: true}) Expect(newLumigo.Spec.Infrastructure.KubeEvents.Enabled).To(&beBoolPointer{expectedValue: true}) diff --git a/controller/src/webhooks/injector/injector_webhook_suite_test.go b/controller/src/webhooks/injector/injector_webhook_suite_test.go index ef0e977..b91f37e 100644 --- a/controller/src/webhooks/injector/injector_webhook_suite_test.go +++ b/controller/src/webhooks/injector/injector_webhook_suite_test.go @@ -121,7 +121,7 @@ var _ = BeforeSuite(func() { CRDDirectoryPaths: []string{filepath.Join("..", "..", "config", "crd", "bases")}, ErrorIfCRDPathMissing: false, WebhookInstallOptions: envtest.WebhookInstallOptions{ - Paths: []string{filepath.Join("..", "..", "config", "webhooks")}, + Paths: []string{filepath.Join("..", "..", "..", "..", "config", "webhooks")}, }, } From 5ec1a130e7f5476bbc3d2f45afee724ad6052c8f Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 2 Jun 2024 14:18:15 +0300 Subject: [PATCH 12/30] Fix UT --- Makefile | 3 +-- controller/src/api/v1alpha1/lumigo_webhook_suite_test.go | 4 ++-- .../src/webhooks/defaulter/defaulter_webhook_suite_test.go | 6 +++--- .../src/webhooks/injector/injector_webhook_suite_test.go | 4 ++-- 4 files changed, 8 insertions(+), 9 deletions(-) diff --git a/Makefile b/Makefile index 806afb0..49c409c 100644 --- a/Makefile +++ b/Makefile @@ -182,8 +182,7 @@ controller-gen: $(CONTROLLER_GEN) ## Download controller-gen locally if necessar $(CONTROLLER_GEN): $(LOCALBIN) test -s $(LOCALBIN)/controller-gen || GOBIN=$(LOCALBIN) $(GOCMD) install sigs.k8s.io/controller-tools/cmd/controller-gen@$(CONTROLLER_TOOLS_VERSION) -## Pin the version of setup-envtest until https://github.com/kubernetes-sigs/controller-runtime/issues/2720 is resolved. .PHONY: envtest envtest: $(ENVTEST) ## Download envtest-setup locally if necessary. $(ENVTEST): $(LOCALBIN) - test -s $(LOCALBIN)/setup-envtest || GOBIN=$(LOCALBIN) $(GOCMD) install sigs.k8s.io/controller-runtime/tools/setup-envtest@c7e1dc9b \ No newline at end of file + test -s $(LOCALBIN)/setup-envtest || GOBIN=$(LOCALBIN) $(GOCMD) install sigs.k8s.io/controller-runtime/tools/setup-envtest \ No newline at end of file diff --git a/controller/src/api/v1alpha1/lumigo_webhook_suite_test.go b/controller/src/api/v1alpha1/lumigo_webhook_suite_test.go index 20a9749..0d07bd8 100644 --- a/controller/src/api/v1alpha1/lumigo_webhook_suite_test.go +++ b/controller/src/api/v1alpha1/lumigo_webhook_suite_test.go @@ -61,8 +61,8 @@ var _ = BeforeSuite(func() { By("bootstrapping test environment") testEnv = &envtest.Environment{ - CRDDirectoryPaths: []string{filepath.Join("..", "..", "config", "crd", "bases")}, - ErrorIfCRDPathMissing: false, + CRDDirectoryPaths: []string{filepath.Join("..", "..", "..", "..", "config", "crd", "bases")}, + ErrorIfCRDPathMissing: true, WebhookInstallOptions: envtest.WebhookInstallOptions{ Paths: []string{filepath.Join("..", "..", "config", "webhook")}, }, diff --git a/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go b/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go index 28c8782..7e3a729 100644 --- a/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go +++ b/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go @@ -71,8 +71,8 @@ var _ = BeforeSuite(func() { By("bootstrapping test environment") testEnv = &envtest.Environment{ - CRDDirectoryPaths: []string{filepath.Join("..", "..", "..", "..", "..", "config", "crd", "bases")}, - ErrorIfCRDPathMissing: false, + CRDDirectoryPaths: []string{filepath.Join("..", "..", "..", "..", "config", "crd", "bases")}, + ErrorIfCRDPathMissing: true, WebhookInstallOptions: envtest.WebhookInstallOptions{ Paths: []string{filepath.Join("..", "..", "..", "..", "config", "webhooks")}, }, @@ -218,7 +218,7 @@ var _ = Context("Lumigo defaulter webhook", func() { }, } - Expect(k8sClient.Create(ctx, &newLumigo)).To(MatchError("abc")) + Expect(k8sClient.Create(ctx, &newLumigo)).To(Succeed()) Expect(newLumigo.Spec.Infrastructure.Enabled).To(&beBoolPointer{expectedValue: true}) Expect(newLumigo.Spec.Infrastructure.KubeEvents.Enabled).To(&beBoolPointer{expectedValue: true}) diff --git a/controller/src/webhooks/injector/injector_webhook_suite_test.go b/controller/src/webhooks/injector/injector_webhook_suite_test.go index b91f37e..283bc14 100644 --- a/controller/src/webhooks/injector/injector_webhook_suite_test.go +++ b/controller/src/webhooks/injector/injector_webhook_suite_test.go @@ -118,8 +118,8 @@ var _ = BeforeSuite(func() { By("bootstrapping test environment") testEnv = &envtest.Environment{ - CRDDirectoryPaths: []string{filepath.Join("..", "..", "config", "crd", "bases")}, - ErrorIfCRDPathMissing: false, + CRDDirectoryPaths: []string{filepath.Join("..", "..", "..", "..", "config", "crd", "bases")}, + ErrorIfCRDPathMissing: true, WebhookInstallOptions: envtest.WebhookInstallOptions{ Paths: []string{filepath.Join("..", "..", "..", "..", "config", "webhooks")}, }, From 6efff14753d8055c29fa5acf2f726591f785a462 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 2 Jun 2024 16:17:55 +0300 Subject: [PATCH 13/30] Inject LUMIGO_ENABLE_LOGS --- Makefile | 2 +- controller/src/api/v1alpha1/lumigo_types.go | 9 ++++++ .../src/controllers/lumigo_controller.go | 3 +- .../lumigo_controller_suite_test.go | 32 ++++++++++--------- controller/src/mutation/matchers.go | 31 +++++++++++++++--- controller/src/mutation/mutate.go | 24 ++++++++++++-- .../webhooks/defaulter/defaulter_webhook.go | 5 +++ .../src/webhooks/injector/injector_webhook.go | 2 +- .../injector/injector_webhook_suite_test.go | 21 ++++++------ 9 files changed, 96 insertions(+), 33 deletions(-) diff --git a/Makefile b/Makefile index 49c409c..bbe4695 100644 --- a/Makefile +++ b/Makefile @@ -73,7 +73,7 @@ vet: ## Run go vet against code. .PHONY: test test: manifests generate fmt vet envtest ## Run tests. - (cd ./controller/src && KUBEBUILDER_ASSETS="$(shell $(ENVTEST) use $(ENVTEST_K8S_VERSION) --bin-dir $(LOCALBIN) -p path)" $(GOCMD) test ./... -failfast -coverprofile cover.out ) + (cd ./controller/src && KUBEBUILDER_ASSETS="$(shell $(ENVTEST) use $(ENVTEST_K8S_VERSION) --bin-dir $(LOCALBIN) -p path)" $(GOCMD) test ./... -coverprofile cover.out ) ##@ Build diff --git a/controller/src/api/v1alpha1/lumigo_types.go b/controller/src/api/v1alpha1/lumigo_types.go index 7d9b6a9..61780d1 100644 --- a/controller/src/api/v1alpha1/lumigo_types.go +++ b/controller/src/api/v1alpha1/lumigo_types.go @@ -54,6 +54,7 @@ type LumigoSpec struct { // https://docs.lumigo.io/docs/lumigo-tokens LumigoToken Credentials `json:"lumigoToken,omitempty"` Tracing TracingSpec `json:"tracing,omitempty"` + Logging LoggingSpec `json:"logging,omitempty"` Infrastructure InfrastructureSpec `json:"infrastructure,omitempty"` } @@ -77,6 +78,14 @@ type TracingSpec struct { Injection InjectionSpec `json:"injection"` } +type LoggingSpec struct { + // Whether Daemonsets, Deployments, ReplicaSets, StatefulSets, CronJobs and Jobs + // that are created or updated after the creation of the Lumigo resource have their logs sent to Lumigo. + // If unspecified, defaults to `false`. + // +kubebuilder:validation:Optional + Enabled *bool `json:"enabled"` // Using a pointer to support cases where the value is not set (and it counts as disabled) +} + type InjectionSpec struct { // Whether Daemonsets, Deployments, ReplicaSets, StatefulSets, CronJobs and Jobs // that are created or updated after the creation of the Lumigo resource be injected. diff --git a/controller/src/controllers/lumigo_controller.go b/controller/src/controllers/lumigo_controller.go index ced1b06..387cda3 100644 --- a/controller/src/controllers/lumigo_controller.go +++ b/controller/src/controllers/lumigo_controller.go @@ -490,7 +490,7 @@ func (r *LumigoReconciler) updateStatusIfNeeded(ctx context.Context, logger logr } func (r *LumigoReconciler) injectLumigoIntoResources(ctx context.Context, lumigo *operatorv1alpha1.Lumigo, log *logr.Logger) error { - mutator, err := mutation.NewMutator(log, &lumigo.Spec.LumigoToken, r.LumigoOperatorVersion, r.LumigoInjectorImage, r.TelemetryProxyOtlpServiceUrl, r.TelemetryProxyOtlpLogsServiceUrl) + mutator, err := mutation.NewMutator(log, &lumigo.Spec, r.LumigoOperatorVersion, r.LumigoInjectorImage, r.TelemetryProxyOtlpServiceUrl, r.TelemetryProxyOtlpLogsServiceUrl) if err != nil { return fmt.Errorf("cannot instantiate mutator: %w", err) } @@ -689,6 +689,7 @@ func (r *LumigoReconciler) injectLumigoIntoResources(ctx context.Context, lumigo func (r *LumigoReconciler) removeLumigoFromResources(ctx context.Context, lumigo *operatorv1alpha1.Lumigo, log *logr.Logger) error { namespace := lumigo.Namespace + mutator, err := mutation.NewMutator(log, nil, r.LumigoOperatorVersion, r.LumigoInjectorImage, r.TelemetryProxyOtlpServiceUrl, r.TelemetryProxyOtlpLogsServiceUrl) if err != nil { return fmt.Errorf("cannot instantiate mutator: %w", err) diff --git a/controller/src/controllers/lumigo_controller_suite_test.go b/controller/src/controllers/lumigo_controller_suite_test.go index 4a995f9..376a595 100644 --- a/controller/src/controllers/lumigo_controller_suite_test.go +++ b/controller/src/controllers/lumigo_controller_suite_test.go @@ -197,7 +197,6 @@ var _ = Context("Lumigo controller", func() { }) Context("with one Lumigo instance", func() { - It("has an error if the referenced secret does not exist", func() { lumigoName := "lumigo" lumigo := newLumigo(namespaceName, lumigoName, operatorv1alpha1.Credentials{ @@ -205,7 +204,7 @@ var _ = Context("Lumigo controller", func() { Name: "lumigo-credentials", Key: "token", }, - }, true, true, true) + }, true, true, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) By("the Lumigo instance goes in an erroneous state", func() { @@ -253,7 +252,7 @@ var _ = Context("Lumigo controller", func() { Name: "lumigo-credentials", Key: expectedTokenKey, }, - }, true, true, true) + }, true, true, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) By("the Lumigo instance goes in an erroneous state", func() { @@ -333,7 +332,7 @@ var _ = Context("Lumigo controller", func() { Name: "lumigo-credentials", Key: expectedTokenKey, }, - }, true, true, true) + }, true, true, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) By("the Lumigo instance goes in an erroneous state", func() { @@ -434,7 +433,7 @@ var _ = Context("Lumigo controller", func() { Name: lumigoSecretName, Key: expectedTokenKey, }, - }, true, false, false) + }, true, false, false, true) g.Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) }, defaultTimeout, defaultInterval).Should(Succeed()) }) @@ -453,7 +452,7 @@ var _ = Context("Lumigo controller", func() { Name: deploymentName, }, deployment)).To(Succeed()) - Expect(deployment).NotTo(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl)) + Expect(deployment).NotTo(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) }) }) @@ -517,7 +516,7 @@ var _ = Context("Lumigo controller", func() { Name: lumigoSecretName, Key: expectedTokenKey, }, - }, true, true, false) + }, true, true, false, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) Eventually(func(g Gomega) { @@ -537,7 +536,7 @@ var _ = Context("Lumigo controller", func() { Name: deploymentName, }, deployment)).To(Succeed()) - g.Expect(deployment).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl)) + g.Expect(deployment).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) g.Expect(currentVersionOf(lumigo, g)).To(BeActive()) g.Expect(currentVersionOf(lumigo, g)).To(HaveInstrumentedObjectReferenceFor(deployment)) }, defaultTimeout, defaultInterval).Should(Succeed()) @@ -565,7 +564,7 @@ var _ = Context("Lumigo controller", func() { Name: deploymentName, }, deployment)).To(Succeed()) - Expect(deployment).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl)) + Expect(deployment).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) }) }) @@ -628,7 +627,7 @@ var _ = Context("Lumigo controller", func() { Name: lumigoSecretName, Key: expectedTokenKey, }, - }, true, true, true) + }, true, true, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) Eventually(func(g Gomega) { @@ -644,7 +643,7 @@ var _ = Context("Lumigo controller", func() { Name: deploymentName, }, deploymentAfter)).To(Succeed()) - Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl)) + Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) }) By("Deleting the Lumigo resource", func() { @@ -710,7 +709,7 @@ var _ = Context("Lumigo controller", func() { Name: lumigoSecretName, Key: expectedTokenKey, }, - }, true, true, false) + }, true, true, false, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) Eventually(func(g Gomega) { @@ -763,7 +762,7 @@ var _ = Context("Lumigo controller", func() { }, } - lumigo1 := newLumigo(namespaceName, "lumigo1", lumigoToken, true, true, true) + lumigo1 := newLumigo(namespaceName, "lumigo1", lumigoToken, true, true, true, true) Expect(k8sClient.Create(ctx, lumigo1)).Should(Succeed()) Eventually(func(g Gomega) { g.Expect(currentVersionOf(lumigo1, g)).To(BeActive()) @@ -771,7 +770,7 @@ var _ = Context("Lumigo controller", func() { Expect(telemetryProxyNamespacesFile).To(BeMonitoringNamespace(namespaceName)) - lumigo2 := newLumigo(namespaceName, "lumigo2", lumigoToken, true, true, true) + lumigo2 := newLumigo(namespaceName, "lumigo2", lumigoToken, true, true, true, true) By("adding a second Lumigo in the namespace", func() { Expect(k8sClient.Create(ctx, lumigo2)).Should(Succeed()) @@ -803,7 +802,7 @@ var _ = Context("Lumigo controller", func() { }) -func newLumigo(namespace string, name string, lumigoToken operatorv1alpha1.Credentials, injectionEnabled bool, injectLumigoIntoExistingResourcesOnCreation bool, removeLumigoFromResourcesOnDeletion bool) *operatorv1alpha1.Lumigo { +func newLumigo(namespace string, name string, lumigoToken operatorv1alpha1.Credentials, injectionEnabled bool, injectLumigoIntoExistingResourcesOnCreation bool, removeLumigoFromResourcesOnDeletion bool, loggingEnabled bool) *operatorv1alpha1.Lumigo { return &operatorv1alpha1.Lumigo{ ObjectMeta: metav1.ObjectMeta{ Namespace: namespace, @@ -819,6 +818,9 @@ func newLumigo(namespace string, name string, lumigoToken operatorv1alpha1.Crede RemoveLumigoFromResourcesOnDeletion: &removeLumigoFromResourcesOnDeletion, }, }, + Logging: operatorv1alpha1.LoggingSpec{ + Enabled: &loggingEnabled, + }, }, } } diff --git a/controller/src/mutation/matchers.go b/controller/src/mutation/matchers.go index f8892c8..1a0c982 100644 --- a/controller/src/mutation/matchers.go +++ b/controller/src/mutation/matchers.go @@ -3,6 +3,7 @@ package mutation import ( "fmt" "reflect" + "strconv" "github.com/onsi/gomega" "github.com/onsi/gomega/format" @@ -15,16 +16,19 @@ import ( var ( errAutotraceLabelNotFound = fmt.Errorf("'%s' label not found", LumigoAutoTraceLabelKey) - errLdPreloadEnvVarNotSet = fmt.Errorf("the environment variable '%s' is not set in the container's Env", LdPreloadEnvVarName) - errLumigoTracerTokenEnvVarNotSet = fmt.Errorf("the environment variable '%s' is not set in the container's Env", LumigoTracerTokenEnvVarName) - errLumigoEndpointEnvVarNotSet = fmt.Errorf("the environment variable '%s' is not set in the container's Env", LumigoEndpointEnvVarName) + errEnvVarMissingFormat = "the environment variable '%s' is not set in the container's Env" + errLdPreloadEnvVarNotSet = fmt.Errorf(errEnvVarMissingFormat, LdPreloadEnvVarName) + errLumigoTracerTokenEnvVarNotSet = fmt.Errorf(errEnvVarMissingFormat, LumigoTracerTokenEnvVarName) + errLumigoEndpointEnvVarNotSet = fmt.Errorf(errEnvVarMissingFormat, LumigoEndpointEnvVarName) + errLumigoEnableLogsEnvVarNotSet = fmt.Errorf(errEnvVarMissingFormat, LumigoEnableLogsEnvVarName) ) -func BeInstrumentedWithLumigo(lumigoOperatorVersion string, lumigoInjectorImage string, lumigoEndpointUrl string) types.GomegaMatcher { +func BeInstrumentedWithLumigo(lumigoOperatorVersion string, lumigoInjectorImage string, lumigoEndpointUrl string, lumigoLogsEnabled bool) types.GomegaMatcher { return &beInstrumentedWithLumigo{ lumigoOperatorVersion: lumigoOperatorVersion, lumigoInjectorImage: lumigoInjectorImage, lumigoEndpointUrl: lumigoEndpointUrl, + lumigoLogsEnabled: lumigoLogsEnabled, } } @@ -32,6 +36,7 @@ type beInstrumentedWithLumigo struct { lumigoOperatorVersion string lumigoInjectorImage string lumigoEndpointUrl string + lumigoLogsEnabled bool } func (m *beInstrumentedWithLumigo) Match(actual interface{}) (bool, error) { @@ -248,6 +253,8 @@ func (m *beInstrumentedWithLumigo) isContainerInstrumentedWithLumigo(container * ldPreloadEnvVarFound := false lumigoTracerTokenEnvVarFound := false lumigoEndpointEnvVarFound := false + lumigoEnableLogsEnvVarFound := false + for _, envVar := range container.Env { switch envVar.Name { case LdPreloadEnvVarName: @@ -267,6 +274,18 @@ func (m *beInstrumentedWithLumigo) isContainerInstrumentedWithLumigo(container * return false, fmt.Errorf("unexpected value for '%s' env var: expected '%s', found '%s'", LumigoEndpointEnvVarName, m.lumigoEndpointUrl, envVar.Value) } lumigoEndpointEnvVarFound = true + + case LumigoEnableLogsEnvVarName: + boolValue, err := strconv.ParseBool(envVar.Value) + + if err != nil { + return false, fmt.Errorf("unexpected value for boolean '%s' env var: '%s'", LumigoEnableLogsEnvVarName, envVar.Value) + } + + if boolValue != m.lumigoLogsEnabled { + return false, fmt.Errorf("unexpected value for '%s' env var: expected '%t', found '%s'", LumigoEnableLogsEnvVarName, m.lumigoLogsEnabled, envVar.Value) + } + lumigoEnableLogsEnvVarFound = true } } @@ -282,6 +301,10 @@ func (m *beInstrumentedWithLumigo) isContainerInstrumentedWithLumigo(container * return false, errLumigoEndpointEnvVarNotSet } + if !lumigoEnableLogsEnvVarFound { + return false, errLumigoEnableLogsEnvVarNotSet + } + volumeMountFound := false for _, volumeMount := range container.VolumeMounts { if volumeMount.Name == LumigoInjectorVolumeName { diff --git a/controller/src/mutation/mutate.go b/controller/src/mutation/mutate.go index 94065a9..19a32fd 100644 --- a/controller/src/mutation/mutate.go +++ b/controller/src/mutation/mutate.go @@ -22,6 +22,7 @@ import ( "fmt" "reflect" + "strconv" "strings" "github.com/go-logr/logr" @@ -47,6 +48,7 @@ const LumigoInjectorVolumeMountPoint = "/opt/lumigo" const LumigoTracerTokenEnvVarName = "LUMIGO_TRACER_TOKEN" const LumigoEndpointEnvVarName = "LUMIGO_ENDPOINT" const LumigoLogsEndpointEnvVarName = "LUMIGO_LOGS_ENDPOINT" +const LumigoEnableLogsEnvVarName = "LUMIGO_ENABLE_LOGS" const LumigoContainerNameEnvVarName = "LUMIGO_CONTAINER_NAME" const LdPreloadEnvVarName = "LD_PRELOAD" const LdPreloadEnvVarValue = LumigoInjectorVolumeMountPoint + "/injector/lumigo_injector.so" @@ -80,6 +82,7 @@ type mutatorImpl struct { lumigoAutotraceLabelValue string lumigoEndpoint string lumigoLogsEndpoint string + lumigoEnableLogs bool lumigoToken *operatorv1alpha1.Credentials lumigoInjectorImage string } @@ -88,19 +91,25 @@ func (m *mutatorImpl) GetAutotraceLabelValue() string { return m.lumigoAutotraceLabelValue } -func NewMutator(Log *logr.Logger, LumigoToken *operatorv1alpha1.Credentials, LumigoOperatorVersion string, LumigoInjectorImage string, TelemetryProxyOtlpServiceUrl string, TelemetryProxyOtlpLogsServiceUrl string) (Mutator, error) { +func NewMutator(Log *logr.Logger, LumigoSpec *operatorv1alpha1.LumigoSpec, LumigoOperatorVersion string, LumigoInjectorImage string, TelemetryProxyOtlpServiceUrl string, TelemetryProxyOtlpLogsServiceUrl string) (Mutator, error) { version := LumigoOperatorVersion if len(version) > 8 { version = version[0:7] // Label values have a limit of 63 characters, we stay well below that } + lumigoEnableLogs := false + if LumigoSpec.Logging.Enabled != nil { + lumigoEnableLogs = *LumigoSpec.Logging.Enabled + } + return &mutatorImpl{ log: Log, lumigoAutotraceLabelValue: LumigoAutoTraceLabelVersionPrefixValue + version, lumigoEndpoint: TelemetryProxyOtlpServiceUrl, lumigoLogsEndpoint: TelemetryProxyOtlpLogsServiceUrl, - lumigoToken: LumigoToken, + lumigoEnableLogs: lumigoEnableLogs, + lumigoToken: &LumigoSpec.LumigoToken, lumigoInjectorImage: LumigoInjectorImage, }, nil } @@ -418,6 +427,17 @@ func (m *mutatorImpl) injectLumigoIntoPodSpec(podSpec *corev1.PodSpec) error { envVars[lumigoLogsEndpointEnvVarIndex] = *lumigoLogsEndpointEnvVar } + lumigoEnableLogsEnvVar := &corev1.EnvVar{ + Name: LumigoEnableLogsEnvVarName, + Value: strconv.FormatBool(m.lumigoEnableLogs), + } + lumigoEnableLogsEnvVarIndex := slices.IndexFunc(envVars, func(c corev1.EnvVar) bool { return c.Name == LumigoEnableLogsEnvVarName }) + if lumigoEnableLogsEnvVarIndex < 0 { + envVars = append(envVars, *lumigoEnableLogsEnvVar) + } else { + envVars[lumigoEnableLogsEnvVarIndex] = *lumigoEnableLogsEnvVar + } + lumigoContainerNameEnvVar := &corev1.EnvVar{ Name: LumigoContainerNameEnvVarName, Value: container.Name, diff --git a/controller/src/webhooks/defaulter/defaulter_webhook.go b/controller/src/webhooks/defaulter/defaulter_webhook.go index 23e1d2d..3a8b760 100644 --- a/controller/src/webhooks/defaulter/defaulter_webhook.go +++ b/controller/src/webhooks/defaulter/defaulter_webhook.go @@ -146,6 +146,11 @@ func (h *LumigoDefaulterWebhookHandler) Handle(ctx context.Context, request admi newLumigo.Spec.Infrastructure.KubeEvents.Enabled = &newTrue } + newFalse := false + if newLumigo.Spec.Logging.Enabled == nil { + newLumigo.Spec.Logging.Enabled = &newFalse + } + marshalled, err := json.Marshal(newLumigo) if err != nil { return admission.Errored(http.StatusInternalServerError, fmt.Errorf("cannot marshal object %w", err)) diff --git a/controller/src/webhooks/injector/injector_webhook.go b/controller/src/webhooks/injector/injector_webhook.go index 5a44767..47dae20 100644 --- a/controller/src/webhooks/injector/injector_webhook.go +++ b/controller/src/webhooks/injector/injector_webhook.go @@ -133,7 +133,7 @@ func (h *LumigoInjectorWebhookHandler) Handle(ctx context.Context, request admis return admission.Allowed(fmt.Sprintf("The Lumigo object in the '%s' namespace is not active; resource will not be mutated", namespace)) } - mutator, err := mutation.NewMutator(&log, &lumigo.Spec.LumigoToken, h.LumigoOperatorVersion, h.LumigoInjectorImage, h.TelemetryProxyOtlpServiceUrl, h.TelemetryProxyOtlpLogsServiceUrl) + mutator, err := mutation.NewMutator(&log, &lumigo.Spec, h.LumigoOperatorVersion, h.LumigoInjectorImage, h.TelemetryProxyOtlpServiceUrl, h.TelemetryProxyOtlpLogsServiceUrl) if err != nil { return admission.Allowed(fmt.Errorf("cannot instantiate mutator: %w", err).Error()) } diff --git a/controller/src/webhooks/injector/injector_webhook_suite_test.go b/controller/src/webhooks/injector/injector_webhook_suite_test.go index 283bc14..d9c392a 100644 --- a/controller/src/webhooks/injector/injector_webhook_suite_test.go +++ b/controller/src/webhooks/injector/injector_webhook_suite_test.go @@ -323,7 +323,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Name: "DoesNot", Key: "Exist", }, - }, true) + }, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) lumigo.Status = statusErroneous @@ -388,7 +388,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Name: "lumigosecret", Key: "token", }, - }, true) + }, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) lumigo.Status = statusActive @@ -434,7 +434,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Expect(err).NotTo(HaveOccurred()) } - Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl)) + Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) }) It("should inject a deployment with containers running not as root", func() { @@ -443,7 +443,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Name: "lumigosecret", Key: "token", }, - }, true) + }, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) lumigo.Status = statusActive @@ -493,7 +493,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Expect(err).NotTo(HaveOccurred()) } - Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl)) + Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) Expect(deploymentAfter.Spec.Template.Spec.InitContainers[0].SecurityContext.RunAsNonRoot).To(Equal(&f)) }) @@ -503,7 +503,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Name: "lumigosecret", Key: "token", }, - }, true) + }, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) lumigo.Status = statusActive @@ -564,7 +564,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Expect(err).NotTo(HaveOccurred()) } - Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl)) + Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) Expect(deploymentAfter.Spec.Template.Spec.InitContainers[0].SecurityContext.RunAsGroup).To(Equal(&group)) }) @@ -576,7 +576,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Name: "doesnot", Key: "exist", }, - }, true) + }, true, true) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) lumigo.Status = statusActive @@ -638,7 +638,7 @@ var _ = Context("Lumigo defaulter webhook", func() { }) -func newLumigo(namespace string, name string, lumigoToken operatorv1alpha1.Credentials, injectionEnabled bool) *operatorv1alpha1.Lumigo { +func newLumigo(namespace string, name string, lumigoToken operatorv1alpha1.Credentials, injectionEnabled bool, loggingEnabled bool) *operatorv1alpha1.Lumigo { return &operatorv1alpha1.Lumigo{ TypeMeta: metav1.TypeMeta{ Kind: "Lumigo", @@ -656,6 +656,9 @@ func newLumigo(namespace string, name string, lumigoToken operatorv1alpha1.Crede Enabled: &injectionEnabled, }, }, + Logging: operatorv1alpha1.LoggingSpec{ + Enabled: &loggingEnabled, + }, }, } } From 5be719bc902c6b069b631dd0c975c44467611b45 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 2 Jun 2024 17:24:04 +0300 Subject: [PATCH 14/30] Inject LUMIGO_ENABLE_LOGS - tests --- config/crd/bases/operator.lumigo.io_lumigoes.yaml | 11 +++++++++++ .../src/controllers/lumigo_controller_suite_test.go | 4 ++-- controller/src/mutation/mutate.go | 9 +++++++-- .../defaulter/defaulter_webhook_suite_test.go | 3 ++- .../webhooks/injector/injector_webhook_suite_test.go | 6 +++--- 5 files changed, 25 insertions(+), 8 deletions(-) diff --git a/config/crd/bases/operator.lumigo.io_lumigoes.yaml b/config/crd/bases/operator.lumigo.io_lumigoes.yaml index a76d1c7..88ca1dc 100644 --- a/config/crd/bases/operator.lumigo.io_lumigoes.yaml +++ b/config/crd/bases/operator.lumigo.io_lumigoes.yaml @@ -102,6 +102,17 @@ spec: required: - injection type: object + logging: + description: 'LoggingSpec specifies if logging should be set up by the operator' + properties: + enabled: + description: Whether Daemonsets, Deployments, ReplicaSets, + StatefulSets, CronJobs and Jobs that are created or updated + after the creation of the Lumigo resource and are injected will + have their logs sent to Lumigo. + If unspecified, defaults to `false` + type: boolean + type: object type: object status: description: LumigoStatus defines the observed state of Lumigo diff --git a/controller/src/controllers/lumigo_controller_suite_test.go b/controller/src/controllers/lumigo_controller_suite_test.go index 376a595..c913e12 100644 --- a/controller/src/controllers/lumigo_controller_suite_test.go +++ b/controller/src/controllers/lumigo_controller_suite_test.go @@ -516,7 +516,7 @@ var _ = Context("Lumigo controller", func() { Name: lumigoSecretName, Key: expectedTokenKey, }, - }, true, true, false, true) + }, true, true, false, false) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) Eventually(func(g Gomega) { @@ -627,7 +627,7 @@ var _ = Context("Lumigo controller", func() { Name: lumigoSecretName, Key: expectedTokenKey, }, - }, true, true, true, true) + }, true, true, true, false) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) Eventually(func(g Gomega) { diff --git a/controller/src/mutation/mutate.go b/controller/src/mutation/mutate.go index 19a32fd..ece0c70 100644 --- a/controller/src/mutation/mutate.go +++ b/controller/src/mutation/mutate.go @@ -99,17 +99,22 @@ func NewMutator(Log *logr.Logger, LumigoSpec *operatorv1alpha1.LumigoSpec, Lumig } lumigoEnableLogs := false - if LumigoSpec.Logging.Enabled != nil { + if LumigoSpec != nil && LumigoSpec.Logging.Enabled != nil { lumigoEnableLogs = *LumigoSpec.Logging.Enabled } + lumigoToken := &operatorv1alpha1.Credentials{} + if LumigoSpec != nil { + lumigoToken = &LumigoSpec.LumigoToken + } + return &mutatorImpl{ log: Log, lumigoAutotraceLabelValue: LumigoAutoTraceLabelVersionPrefixValue + version, lumigoEndpoint: TelemetryProxyOtlpServiceUrl, lumigoLogsEndpoint: TelemetryProxyOtlpLogsServiceUrl, lumigoEnableLogs: lumigoEnableLogs, - lumigoToken: &LumigoSpec.LumigoToken, + lumigoToken: lumigoToken, lumigoInjectorImage: LumigoInjectorImage, }, nil } diff --git a/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go b/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go index 7e3a729..c89008b 100644 --- a/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go +++ b/controller/src/webhooks/defaulter/defaulter_webhook_suite_test.go @@ -197,7 +197,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Context("when creating the first Lumigo instance in the namespace", func() { - It("it sets defaults for Tracing.Injection.*", func() { + It("it sets defaults for Tracing.Injection.* and Logging", func() { newLumigo := operatorv1alpha1.Lumigo{ TypeMeta: metav1.TypeMeta{ Kind: "Lumigo", @@ -225,6 +225,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Expect(newLumigo.Spec.Tracing.Injection.Enabled).To(&beBoolPointer{expectedValue: true}) Expect(newLumigo.Spec.Tracing.Injection.InjectLumigoIntoExistingResourcesOnCreation).To(&beBoolPointer{expectedValue: true}) Expect(newLumigo.Spec.Tracing.Injection.RemoveLumigoFromResourcesOnDeletion).To(&beBoolPointer{expectedValue: true}) + Expect(newLumigo.Spec.Logging.Enabled).To(&beBoolPointer{expectedValue: false}) }) It("it rejects instances with blank .LumigoToken.Spec.LumigoToken.SecretRef.Name", func() { diff --git a/controller/src/webhooks/injector/injector_webhook_suite_test.go b/controller/src/webhooks/injector/injector_webhook_suite_test.go index d9c392a..198f875 100644 --- a/controller/src/webhooks/injector/injector_webhook_suite_test.go +++ b/controller/src/webhooks/injector/injector_webhook_suite_test.go @@ -434,7 +434,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Expect(err).NotTo(HaveOccurred()) } - Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, false)) + Expect(deploymentAfter).To(mutation.BeInstrumentedWithLumigo(lumigoOperatorVersion, lumigoInjectorImage, telemetryProxyOtlpServiceUrl, true)) }) It("should inject a deployment with containers running not as root", func() { @@ -443,7 +443,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Name: "lumigosecret", Key: "token", }, - }, true, true) + }, true, false) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) lumigo.Status = statusActive @@ -503,7 +503,7 @@ var _ = Context("Lumigo defaulter webhook", func() { Name: "lumigosecret", Key: "token", }, - }, true, true) + }, true, false) Expect(k8sClient.Create(ctx, lumigo)).Should(Succeed()) lumigo.Status = statusActive From ec1982f745cbe91f96e3ed9a4f527b5bb08b3c15 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 2 Jun 2024 17:26:50 +0300 Subject: [PATCH 15/30] Revert envtest version un-pinning --- Makefile | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/Makefile b/Makefile index bbe4695..e5a027e 100644 --- a/Makefile +++ b/Makefile @@ -182,7 +182,8 @@ controller-gen: $(CONTROLLER_GEN) ## Download controller-gen locally if necessar $(CONTROLLER_GEN): $(LOCALBIN) test -s $(LOCALBIN)/controller-gen || GOBIN=$(LOCALBIN) $(GOCMD) install sigs.k8s.io/controller-tools/cmd/controller-gen@$(CONTROLLER_TOOLS_VERSION) +## Pin the version of setup-envtest until https://github.com/kubernetes-sigs/controller-runtime/issues/2720 is resolved. .PHONY: envtest envtest: $(ENVTEST) ## Download envtest-setup locally if necessary. $(ENVTEST): $(LOCALBIN) - test -s $(LOCALBIN)/setup-envtest || GOBIN=$(LOCALBIN) $(GOCMD) install sigs.k8s.io/controller-runtime/tools/setup-envtest \ No newline at end of file + test -s $(LOCALBIN)/setup-envtest || GOBIN=$(LOCALBIN) $(GOCMD) install sigs.k8s.io/controller-runtime/tools/setup-envtest@c7e1dc9b \ No newline at end of file From 0f5ea9fbdad3d9d791dcb6bcf0312eb5d98574e8 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Mon, 3 Jun 2024 08:25:00 +0300 Subject: [PATCH 16/30] Update readme [skip-ci] --- README.md | 24 ++++++++++++++++++++++-- 1 file changed, 22 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 49a430a..4fef142 100644 --- a/README.md +++ b/README.md @@ -72,9 +72,9 @@ The Lumigo Kubernetes operator allows you to set a human-readable name using the You can check which version of the Lumigo Kubernetes operator you have deployed in your cluster as follows: ```sh -$ helm ls -A +$ helm ls -A NAME NAMESPACE REVISION UPDATED STATUS CHART APP VERSION -lumigo lumigo-system 2 2023-07-10 09:20:04.233825 +0200 CEST deployed lumigo-operator-13 13 +lumigo lumigo-system 2 2023-07-10 09:20:04.233825 +0200 CEST deployed lumigo-operator-13 13 ``` The Lumigo Kubernetes operator is reported as `APP VERSION`. @@ -160,6 +160,26 @@ Status: UID: 93d6d809-ac2a-43a9-bc07-f0d4e314efcc ``` +#### Logging support + +The Lumigo Kubernetes operator can automatically forward logs emitted by traced pods to [Lumigo's log-management solution](https://lumigo.io/lp/log-management/), supporting several logging providers (currently `logging` for Python apps, `Winston` and `Bunyan` for Node.js apps). +Enabling log forwarding is done by adding the `spec.logging.enabled` field to the `Lumigo` resource: + +```yaml +apiVersion: operator.lumigo.io/v1alpha1 +kind: Lumigo +metadata: + labels: + app.kubernetes.io/name: lumigo + app.kubernetes.io/instance: lumigo + app.kubernetes.io/part-of: lumigo-operator + name: lumigo +spec: + lumigoToken: ... # same token used for tracing + logging: + enabled: true # enables log forwarding for pods with tracing injected +``` + #### Opting out for specific resources To prevent the Lumigo Kubernetes operator from injecting tracing to pods managed by some resource in a namespace that contains a `Lumigo` resource, add the `lumigo.auto-trace` label set to `false`: From e5d57824ad1da2791f9550a48e68f70a02023c07 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Mon, 3 Jun 2024 10:58:33 +0300 Subject: [PATCH 17/30] Fix docs --- CONTRIBUTING.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index 50a967f..3462d04 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -102,7 +102,7 @@ Changing the target Lumigo backend can be done with a [`patchStrategicMerge`](ht echo -n "apiVersion: apps/v1 kind: Deployment metadata: - name: lumigo-lumigo-controller-manager + name: lumigo-lumigo-operator-controller-manager spec: template: spec: From f1d5d750dc0bdbe81b6612e93e8eef4b5b190cb5 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Mon, 3 Jun 2024 10:58:41 +0300 Subject: [PATCH 18/30] Add the logging to the specs --- charts/lumigo-operator/templates/lumigo-crd.yaml | 11 +++++++++++ helm.yaml | 11 +++++++++++ kustomize.yaml | 11 +++++++++++ 3 files changed, 33 insertions(+) diff --git a/charts/lumigo-operator/templates/lumigo-crd.yaml b/charts/lumigo-operator/templates/lumigo-crd.yaml index 7657eef..4b1cbf1 100644 --- a/charts/lumigo-operator/templates/lumigo-crd.yaml +++ b/charts/lumigo-operator/templates/lumigo-crd.yaml @@ -102,6 +102,17 @@ spec: required: - injection type: object + logging: + description: 'LoggingSpec specifies if logging should be set up by the operator' + properties: + enabled: + description: Whether Daemonsets, Deployments, ReplicaSets, + StatefulSets, CronJobs and Jobs that are created or updated + after the creation of the Lumigo resource and are injected will + have their logs sent to Lumigo. + If unspecified, defaults to `false` + type: boolean + type: object type: object status: description: LumigoStatus defines the observed state of Lumigo diff --git a/helm.yaml b/helm.yaml index d5dec7c..c56e4e7 100644 --- a/helm.yaml +++ b/helm.yaml @@ -153,6 +153,17 @@ spec: required: - injection type: object + logging: + description: 'LoggingSpec specifies if logging should be set up by the operator' + properties: + enabled: + description: Whether Daemonsets, Deployments, ReplicaSets, + StatefulSets, CronJobs and Jobs that are created or updated + after the creation of the Lumigo resource and are injected will + have their logs sent to Lumigo. + If unspecified, defaults to `false` + type: boolean + type: object type: object status: description: LumigoStatus defines the observed state of Lumigo diff --git a/kustomize.yaml b/kustomize.yaml index 15fd8b6..f4f4296 100644 --- a/kustomize.yaml +++ b/kustomize.yaml @@ -96,6 +96,17 @@ spec: required: - injection type: object + logging: + description: 'LoggingSpec specifies if logging should be set up by the operator' + properties: + enabled: + description: Whether Daemonsets, Deployments, ReplicaSets, + StatefulSets, CronJobs and Jobs that are created or updated + after the creation of the Lumigo resource and are injected will + have their logs sent to Lumigo. + If unspecified, defaults to `false` + type: boolean + type: object type: object status: description: LumigoStatus defines the observed state of Lumigo From e0808af603e2071ac8c9f586f9a9a589aa51b1be Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Mon, 3 Jun 2024 11:49:48 +0300 Subject: [PATCH 19/30] Test application logs --- .../kind/internal/lumigo.go | 5 ++++- .../kind/lumigooperator_logs_test.go | 21 +++++++++++++++++-- .../kind/lumigooperator_traces_test.go | 2 +- 3 files changed, 24 insertions(+), 4 deletions(-) diff --git a/tests/kubernetes-distros/kind/internal/lumigo.go b/tests/kubernetes-distros/kind/internal/lumigo.go index 71ef0b6..b5b16ec 100644 --- a/tests/kubernetes-distros/kind/internal/lumigo.go +++ b/tests/kubernetes-distros/kind/internal/lumigo.go @@ -5,7 +5,7 @@ import ( metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" ) -func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey string, injectionEnabled bool) *operatorv1alpha1.Lumigo { +func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey string, injectionEnabled bool, enableLogs bool) *operatorv1alpha1.Lumigo { return &operatorv1alpha1.Lumigo{ ObjectMeta: metav1.ObjectMeta{ Namespace: namespace, @@ -24,6 +24,9 @@ func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey stri Enabled: &injectionEnabled, }, }, + Logging: operatorv1alpha1.LoggingSpec{ + Enabled: &enableLogs, + }, }, } } diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index 8c4d9ec..ee56e25 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -42,7 +42,7 @@ var ( // 2. A Lumigo operator installed into the Kubernetes cluster referenced by the // `kubectl` configuration -func TestLumigoOperatorEventsAndObjects(t *testing.T) { +func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { logger := testr.New(t) testAppDeploymentFeature := features.New("TestApp"). @@ -77,7 +77,7 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { t.Fatal(err) } - lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true) + lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true, true) r, err := resources.New(client.RESTConfig()) if err != nil { @@ -352,6 +352,8 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { t.Fatalf("No log data found in '%s'", logsPath) } + foundApplicationLogs := false + /* * Logs come in multiple lines, and two different scopes; we need to split by '\n'. * bufio.NewScanner fails because our lines are "too long" (LOL). @@ -364,6 +366,17 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { l := exportRequest.Logs().ResourceLogs().Len() for i := 0; i < l; i++ { resourceLogs := exportRequest.Logs().ResourceLogs().At(i) + + for j := 0; j < resourceLogs.ScopeLogs().Len(); j++ { + scopeLogs := resourceLogs.ScopeLogs().At(j) + + // Make sure that applications logs are exported as well, + // and not only the operator built-in logs for events and objects + if scopeLogs.Scope().Name() == "@opentelemetry/winston-transport" { + foundApplicationLogs = true + } + } + resourceAttributes := resourceLogs.Resource().Attributes().AsRaw() if actualClusterName, found := resourceAttributes["k8s.cluster.name"]; !found { @@ -378,6 +391,10 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { t.Fatalf("wrong 'k8s.cluster.uid' value found: '%s'; expected: '%s'; %+v", actualClusterUID, expectedClusterUID, resourceAttributes) } } + + if !foundApplicationLogs { + t.Fatalf("No application logs were found in the logs. Make sure that the test-application uses Winston for logging and has @opentelemetry/winston-transport as a dependency") + } } return ctx diff --git a/tests/kubernetes-distros/kind/lumigooperator_traces_test.go b/tests/kubernetes-distros/kind/lumigooperator_traces_test.go index 610915e..517e107 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_traces_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_traces_test.go @@ -76,7 +76,7 @@ func TestLumigoOperatorTraces(t *testing.T) { t.Fatal(err) } - lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true) + lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true, false) r, err := resources.New(client.RESTConfig()) if err != nil { From 79f13d74dac11c00ec53c511d893bbff6312ab30 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Mon, 3 Jun 2024 12:30:25 +0300 Subject: [PATCH 20/30] Try fix test --- tests/kubernetes-distros/kind/lumigooperator_logs_test.go | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index ee56e25..b9a2a8c 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -391,10 +391,10 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { t.Fatalf("wrong 'k8s.cluster.uid' value found: '%s'; expected: '%s'; %+v", actualClusterUID, expectedClusterUID, resourceAttributes) } } + } - if !foundApplicationLogs { - t.Fatalf("No application logs were found in the logs. Make sure that the test-application uses Winston for logging and has @opentelemetry/winston-transport as a dependency") - } + if !foundApplicationLogs { + t.Fatalf("No application logs were found in the logs. Make sure that the test-application uses Winston for logging and has @opentelemetry/winston-transport as a dependency") } return ctx From e6e9c149a313458e3c1372c5ebce7c115ae4de44 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Mon, 3 Jun 2024 13:58:51 +0300 Subject: [PATCH 21/30] Move to the correct test suite --- tests/kubernetes-distros/kind/apps/client/app.js | 6 ------ tests/kubernetes-distros/kind/lumigooperator_logs_test.go | 8 +++++++- 2 files changed, 7 insertions(+), 7 deletions(-) diff --git a/tests/kubernetes-distros/kind/apps/client/app.js b/tests/kubernetes-distros/kind/apps/client/app.js index 1cd46e5..f428bd6 100644 --- a/tests/kubernetes-distros/kind/apps/client/app.js +++ b/tests/kubernetes-distros/kind/apps/client/app.js @@ -2,7 +2,6 @@ const axios = require('axios'); const { init } = require('@lumigo/opentelemetry'); const { SpanStatusCode, trace } = require('@opentelemetry/api'); -const winston = require('winston'); if (!process.env.TARGET_URL) { throw new Error("The required environment variable 'TARGET_URL' is not set") @@ -11,11 +10,6 @@ if (!process.env.TARGET_URL) { (async () => { const { tracerProvider } = await init; const tracer = trace.getTracer(__filename) - const logger = winston.createLogger({ - transports: [new winston.transports.Console()], - level: 'info' - }); - logger.info('Starting batch job...'); await tracer.startActiveSpan('batch', async (rootSpan) => { try { const res = await axios.post(`${process.env.TARGET_URL}/api/checkout`, { diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index b9a2a8c..3b34d4e 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -125,7 +125,13 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { { Name: "myapp", Image: testImage, - Command: []string{"python", "-c", fmt.Sprintf("while True: print(\"%s\"); import time; time.sleep(5)", logOutput)}, + Command: []string{"python", "-c", fmt.Sprintf(` + import logging + import time + while True: + logging.getLogger(__name__).info('%s') + time.sleep(5) + `, logOutput)}, }, }, }, From 846df94570c12dc907f17524181d906fa10ae2de Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Mon, 3 Jun 2024 15:41:50 +0300 Subject: [PATCH 22/30] Try fix test --- tests/kubernetes-distros/kind/lumigooperator_logs_test.go | 8 +------- 1 file changed, 1 insertion(+), 7 deletions(-) diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index 3b34d4e..eabbb0c 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -125,13 +125,7 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { { Name: "myapp", Image: testImage, - Command: []string{"python", "-c", fmt.Sprintf(` - import logging - import time - while True: - logging.getLogger(__name__).info('%s') - time.sleep(5) - `, logOutput)}, + Command: []string{"python", "-c", fmt.Sprintf("while True: import time; import logging; logging.getLogger('test').warning('%s'); time.sleep(5)", logOutput)}, }, }, }, From 3138cd829c0576fdd1851b5546558c5f9abfd247 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Tue, 4 Jun 2024 11:16:54 +0300 Subject: [PATCH 23/30] Try python logging --- tests/kubernetes-distros/kind/apps/python/Dockerfile | 9 +++++++++ tests/kubernetes-distros/kind/apps/python/app.py | 10 ++++++++++ .../kind/internal/build_docker_image.go | 1 + tests/kubernetes-distros/kind/internal/context.go | 1 + .../kind/lumigooperator_logs_test.go | 11 +++++------ tests/kubernetes-distros/kind/main_test.go | 7 +++++++ .../kind/resources/kind-config.yaml.tpl | 8 +++++++- 7 files changed, 40 insertions(+), 7 deletions(-) create mode 100644 tests/kubernetes-distros/kind/apps/python/Dockerfile create mode 100644 tests/kubernetes-distros/kind/apps/python/app.py diff --git a/tests/kubernetes-distros/kind/apps/python/Dockerfile b/tests/kubernetes-distros/kind/apps/python/Dockerfile new file mode 100644 index 0000000..c9698b1 --- /dev/null +++ b/tests/kubernetes-distros/kind/apps/python/Dockerfile @@ -0,0 +1,9 @@ +FROM python:3.11-slim + +WORKDIR /code + +COPY ./app.py /code/app.py + +LABEL distro-version='DEV' + +ENTRYPOINT [] \ No newline at end of file diff --git a/tests/kubernetes-distros/kind/apps/python/app.py b/tests/kubernetes-distros/kind/apps/python/app.py new file mode 100644 index 0000000..4484a0f --- /dev/null +++ b/tests/kubernetes-distros/kind/apps/python/app.py @@ -0,0 +1,10 @@ +import sys +import time +import logging + +logger = logging.getLogger("test") +logger.setLevel(logging.DEBUG) + +while True: + logger.info(sys.argv[1]) + time.sleep(5) \ No newline at end of file diff --git a/tests/kubernetes-distros/kind/internal/build_docker_image.go b/tests/kubernetes-distros/kind/internal/build_docker_image.go index b62fc8c..da41c30 100644 --- a/tests/kubernetes-distros/kind/internal/build_docker_image.go +++ b/tests/kubernetes-distros/kind/internal/build_docker_image.go @@ -17,6 +17,7 @@ import ( const ( DEFAULT_JS_CLIENT_IMG_NAME = "host.docker.internal:5000/test-apps/js/client" DEFAULT_JS_SERVER_IMG_NAME = "host.docker.internal:5000/test-apps/js/server" + DEFAULT_PYTHON_IMG_NAME = "host.docker.internal:5000/test-apps/python-app" ) func BuildDockerImageAndExportArchive(imageName, sourceFolder, imageArchivePath string, logger *log.Logger) env.Func { diff --git a/tests/kubernetes-distros/kind/internal/context.go b/tests/kubernetes-distros/kind/internal/context.go index c4c21c1..447ef9c 100644 --- a/tests/kubernetes-distros/kind/internal/context.go +++ b/tests/kubernetes-distros/kind/internal/context.go @@ -15,6 +15,7 @@ var ( ContextKeySendDataToLumigo = ContextKey("lumigo/upstream/send_data") ContextTestAppJsClientImageName = ContextKey("test-apps/js/client/image/name") ContextTestAppJsServerImageName = ContextKey("test-apps/js/server/image/name") + ContextTestAppPythonImageName = ContextKey("test-apps/python/image/name") ) func (c ContextKey) String() string { diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index eabbb0c..7ba48c6 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -87,8 +87,7 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { r.Create(ctx, lumigo) deploymentName := "testdeployment" - testImage := "python" - logOutput := "IT'S ALIIIIIIVE!" + logOutput := "I AM ALIIIIIIVE!" tr := true var g int64 = 5678 @@ -124,8 +123,8 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { Containers: []corev1.Container{ { Name: "myapp", - Image: testImage, - Command: []string{"python", "-c", fmt.Sprintf("while True: import time; import logging; logging.getLogger('test').warning('%s'); time.sleep(5)", logOutput)}, + Image: ctx.Value(internal.ContextTestAppPythonImageName).(string), + Command: []string{"python", "app.py", logOutput}, }, }, }, @@ -372,7 +371,7 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { // Make sure that applications logs are exported as well, // and not only the operator built-in logs for events and objects - if scopeLogs.Scope().Name() == "@opentelemetry/winston-transport" { + if !strings.Contains(scopeLogs.Scope().Name(), "lumigo") { foundApplicationLogs = true } } @@ -394,7 +393,7 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { } if !foundApplicationLogs { - t.Fatalf("No application logs were found in the logs. Make sure that the test-application uses Winston for logging and has @opentelemetry/winston-transport as a dependency") + t.Fatalf("No application logs were found in the logs. Make sure that the test-application logs are emitted by checking %s", logsPath) } return ctx diff --git a/tests/kubernetes-distros/kind/main_test.go b/tests/kubernetes-distros/kind/main_test.go index f3eef20..6e63de8 100644 --- a/tests/kubernetes-distros/kind/main_test.go +++ b/tests/kubernetes-distros/kind/main_test.go @@ -191,6 +191,9 @@ func TestMain(m *testing.M) { testJsServerImageName := fmt.Sprintf("%s:%s", internal.DEFAULT_JS_SERVER_IMG_NAME, runId) testJsServerImageArchivePath := filepath.Join(tmpDir, "test-js-server.tgz") + testPythonImageName := fmt.Sprintf("%s:%s", internal.DEFAULT_PYTHON_IMG_NAME, runId) + testPythonImageArchivePath := filepath.Join(tmpDir, "test-python.tgz") + ctx := context.WithValue(context.Background(), internal.ContextKeyRunId, runId) ctx = context.WithValue(ctx, internal.ContextKeyKubernetesClusterName, kindClusterName) ctx = context.WithValue(ctx, internal.ContextKeyOtlpSinkConfigPath, dataSinkConfigDir) @@ -203,6 +206,7 @@ func TestMain(m *testing.M) { ctx = context.WithValue(ctx, internal.ContextKeyOperatorTelemetryProxyImage, telemetryProxyImageName) ctx = context.WithValue(ctx, internal.ContextTestAppJsClientImageName, testJsClientImageName) ctx = context.WithValue(ctx, internal.ContextTestAppJsServerImageName, testJsServerImageName) + ctx = context.WithValue(ctx, internal.ContextTestAppPythonImageName, testPythonImageName) testEnv = env.NewWithConfig(cfg).WithContext(ctx) @@ -215,6 +219,7 @@ func TestMain(m *testing.M) { internal.BuildDockerImageAndExportArchive(telemetryProxyImageName, filepath.Join(repoRoot, "telemetryproxy"), telemetryProxyImageArchivePath, logger), internal.BuildDockerImageAndExportArchive(testJsClientImageName, filepath.Join(cwd, "apps", "client"), testJsClientImageArchivePath, logger), internal.BuildDockerImageAndExportArchive(testJsServerImageName, filepath.Join(cwd, "apps", "server"), testJsServerImageArchivePath, logger), + internal.BuildDockerImageAndExportArchive(testPythonImageName, filepath.Join(cwd, "apps", "python"), testPythonImageArchivePath, logger), envfuncs.CreateKindClusterWithConfig(kindClusterName, kindNodeImageVal, kindConfigPath), @@ -222,6 +227,8 @@ func TestMain(m *testing.M) { internal.LoadDockerImageArchiveToCluster(kindClusterName, telemetryProxyImageArchivePath, logger), internal.LoadDockerImageArchiveToCluster(kindClusterName, testJsClientImageArchivePath, logger), internal.LoadDockerImageArchiveToCluster(kindClusterName, testJsServerImageArchivePath, logger), + internal.LoadDockerImageArchiveToCluster(kindClusterName, testPythonImageArchivePath, logger), + /* * Otel Collector image is on Docker hub, no need to pull it into Kind (pulling into Kind * works only for local image, in the local Docker daemon). diff --git a/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl b/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl index fa5aac3..2e88f9d 100644 --- a/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl +++ b/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl @@ -6,4 +6,10 @@ nodes: - hostPath: '{{OTLP_SINK_CONFIG_VOLUME_PATH}}' containerPath: /lumigo/otlp-sink/config - hostPath: '{{OTLP_SINK_DATA_VOLUME_PATH}}' - containerPath: /lumigo/otlp-sink/data \ No newline at end of file + containerPath: /lumigo/otlp-sink/data + kubeadmConfigPatches: + - | + kind: InitConfiguration + nodeRegistration: + kubeletExtraArgs: + system-reserved: memory=4Gi \ No newline at end of file From c2d48cd757e5c3958518896145996109373ead60 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Tue, 4 Jun 2024 11:38:06 +0300 Subject: [PATCH 24/30] Remove log testing --- .../kind/apps/client/app.js | 6 ++++ .../kind/apps/python/Dockerfile | 9 ------ .../kind/apps/python/app.py | 10 ------- .../kind/internal/build_docker_image.go | 1 - .../kind/internal/context.go | 1 - .../kind/internal/lumigo.go | 5 +--- .../kind/lumigooperator_logs_test.go | 28 ++++--------------- .../kind/lumigooperator_traces_test.go | 2 +- tests/kubernetes-distros/kind/main_test.go | 7 ----- .../kind/resources/kind-config.yaml.tpl | 8 +----- 10 files changed, 15 insertions(+), 62 deletions(-) delete mode 100644 tests/kubernetes-distros/kind/apps/python/Dockerfile delete mode 100644 tests/kubernetes-distros/kind/apps/python/app.py diff --git a/tests/kubernetes-distros/kind/apps/client/app.js b/tests/kubernetes-distros/kind/apps/client/app.js index f428bd6..1cd46e5 100644 --- a/tests/kubernetes-distros/kind/apps/client/app.js +++ b/tests/kubernetes-distros/kind/apps/client/app.js @@ -2,6 +2,7 @@ const axios = require('axios'); const { init } = require('@lumigo/opentelemetry'); const { SpanStatusCode, trace } = require('@opentelemetry/api'); +const winston = require('winston'); if (!process.env.TARGET_URL) { throw new Error("The required environment variable 'TARGET_URL' is not set") @@ -10,6 +11,11 @@ if (!process.env.TARGET_URL) { (async () => { const { tracerProvider } = await init; const tracer = trace.getTracer(__filename) + const logger = winston.createLogger({ + transports: [new winston.transports.Console()], + level: 'info' + }); + logger.info('Starting batch job...'); await tracer.startActiveSpan('batch', async (rootSpan) => { try { const res = await axios.post(`${process.env.TARGET_URL}/api/checkout`, { diff --git a/tests/kubernetes-distros/kind/apps/python/Dockerfile b/tests/kubernetes-distros/kind/apps/python/Dockerfile deleted file mode 100644 index c9698b1..0000000 --- a/tests/kubernetes-distros/kind/apps/python/Dockerfile +++ /dev/null @@ -1,9 +0,0 @@ -FROM python:3.11-slim - -WORKDIR /code - -COPY ./app.py /code/app.py - -LABEL distro-version='DEV' - -ENTRYPOINT [] \ No newline at end of file diff --git a/tests/kubernetes-distros/kind/apps/python/app.py b/tests/kubernetes-distros/kind/apps/python/app.py deleted file mode 100644 index 4484a0f..0000000 --- a/tests/kubernetes-distros/kind/apps/python/app.py +++ /dev/null @@ -1,10 +0,0 @@ -import sys -import time -import logging - -logger = logging.getLogger("test") -logger.setLevel(logging.DEBUG) - -while True: - logger.info(sys.argv[1]) - time.sleep(5) \ No newline at end of file diff --git a/tests/kubernetes-distros/kind/internal/build_docker_image.go b/tests/kubernetes-distros/kind/internal/build_docker_image.go index da41c30..b62fc8c 100644 --- a/tests/kubernetes-distros/kind/internal/build_docker_image.go +++ b/tests/kubernetes-distros/kind/internal/build_docker_image.go @@ -17,7 +17,6 @@ import ( const ( DEFAULT_JS_CLIENT_IMG_NAME = "host.docker.internal:5000/test-apps/js/client" DEFAULT_JS_SERVER_IMG_NAME = "host.docker.internal:5000/test-apps/js/server" - DEFAULT_PYTHON_IMG_NAME = "host.docker.internal:5000/test-apps/python-app" ) func BuildDockerImageAndExportArchive(imageName, sourceFolder, imageArchivePath string, logger *log.Logger) env.Func { diff --git a/tests/kubernetes-distros/kind/internal/context.go b/tests/kubernetes-distros/kind/internal/context.go index 447ef9c..c4c21c1 100644 --- a/tests/kubernetes-distros/kind/internal/context.go +++ b/tests/kubernetes-distros/kind/internal/context.go @@ -15,7 +15,6 @@ var ( ContextKeySendDataToLumigo = ContextKey("lumigo/upstream/send_data") ContextTestAppJsClientImageName = ContextKey("test-apps/js/client/image/name") ContextTestAppJsServerImageName = ContextKey("test-apps/js/server/image/name") - ContextTestAppPythonImageName = ContextKey("test-apps/python/image/name") ) func (c ContextKey) String() string { diff --git a/tests/kubernetes-distros/kind/internal/lumigo.go b/tests/kubernetes-distros/kind/internal/lumigo.go index b5b16ec..71ef0b6 100644 --- a/tests/kubernetes-distros/kind/internal/lumigo.go +++ b/tests/kubernetes-distros/kind/internal/lumigo.go @@ -5,7 +5,7 @@ import ( metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" ) -func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey string, injectionEnabled bool, enableLogs bool) *operatorv1alpha1.Lumigo { +func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey string, injectionEnabled bool) *operatorv1alpha1.Lumigo { return &operatorv1alpha1.Lumigo{ ObjectMeta: metav1.ObjectMeta{ Namespace: namespace, @@ -24,9 +24,6 @@ func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey stri Enabled: &injectionEnabled, }, }, - Logging: operatorv1alpha1.LoggingSpec{ - Enabled: &enableLogs, - }, }, } } diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index 7ba48c6..8c4d9ec 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -42,7 +42,7 @@ var ( // 2. A Lumigo operator installed into the Kubernetes cluster referenced by the // `kubectl` configuration -func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { +func TestLumigoOperatorEventsAndObjects(t *testing.T) { logger := testr.New(t) testAppDeploymentFeature := features.New("TestApp"). @@ -77,7 +77,7 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { t.Fatal(err) } - lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true, true) + lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true) r, err := resources.New(client.RESTConfig()) if err != nil { @@ -87,7 +87,8 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { r.Create(ctx, lumigo) deploymentName := "testdeployment" - logOutput := "I AM ALIIIIIIVE!" + testImage := "python" + logOutput := "IT'S ALIIIIIIVE!" tr := true var g int64 = 5678 @@ -123,8 +124,8 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { Containers: []corev1.Container{ { Name: "myapp", - Image: ctx.Value(internal.ContextTestAppPythonImageName).(string), - Command: []string{"python", "app.py", logOutput}, + Image: testImage, + Command: []string{"python", "-c", fmt.Sprintf("while True: print(\"%s\"); import time; time.sleep(5)", logOutput)}, }, }, }, @@ -351,8 +352,6 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { t.Fatalf("No log data found in '%s'", logsPath) } - foundApplicationLogs := false - /* * Logs come in multiple lines, and two different scopes; we need to split by '\n'. * bufio.NewScanner fails because our lines are "too long" (LOL). @@ -365,17 +364,6 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { l := exportRequest.Logs().ResourceLogs().Len() for i := 0; i < l; i++ { resourceLogs := exportRequest.Logs().ResourceLogs().At(i) - - for j := 0; j < resourceLogs.ScopeLogs().Len(); j++ { - scopeLogs := resourceLogs.ScopeLogs().At(j) - - // Make sure that applications logs are exported as well, - // and not only the operator built-in logs for events and objects - if !strings.Contains(scopeLogs.Scope().Name(), "lumigo") { - foundApplicationLogs = true - } - } - resourceAttributes := resourceLogs.Resource().Attributes().AsRaw() if actualClusterName, found := resourceAttributes["k8s.cluster.name"]; !found { @@ -392,10 +380,6 @@ func TestLumigoOperatorEventsObjectsAndLogs(t *testing.T) { } } - if !foundApplicationLogs { - t.Fatalf("No application logs were found in the logs. Make sure that the test-application logs are emitted by checking %s", logsPath) - } - return ctx }). Assess("Usage heartbeat is sent for instrumented namespaces", func(ctx context.Context, t *testing.T, c *envconf.Config) context.Context { diff --git a/tests/kubernetes-distros/kind/lumigooperator_traces_test.go b/tests/kubernetes-distros/kind/lumigooperator_traces_test.go index 517e107..610915e 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_traces_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_traces_test.go @@ -76,7 +76,7 @@ func TestLumigoOperatorTraces(t *testing.T) { t.Fatal(err) } - lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true, false) + lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true) r, err := resources.New(client.RESTConfig()) if err != nil { diff --git a/tests/kubernetes-distros/kind/main_test.go b/tests/kubernetes-distros/kind/main_test.go index 6e63de8..f3eef20 100644 --- a/tests/kubernetes-distros/kind/main_test.go +++ b/tests/kubernetes-distros/kind/main_test.go @@ -191,9 +191,6 @@ func TestMain(m *testing.M) { testJsServerImageName := fmt.Sprintf("%s:%s", internal.DEFAULT_JS_SERVER_IMG_NAME, runId) testJsServerImageArchivePath := filepath.Join(tmpDir, "test-js-server.tgz") - testPythonImageName := fmt.Sprintf("%s:%s", internal.DEFAULT_PYTHON_IMG_NAME, runId) - testPythonImageArchivePath := filepath.Join(tmpDir, "test-python.tgz") - ctx := context.WithValue(context.Background(), internal.ContextKeyRunId, runId) ctx = context.WithValue(ctx, internal.ContextKeyKubernetesClusterName, kindClusterName) ctx = context.WithValue(ctx, internal.ContextKeyOtlpSinkConfigPath, dataSinkConfigDir) @@ -206,7 +203,6 @@ func TestMain(m *testing.M) { ctx = context.WithValue(ctx, internal.ContextKeyOperatorTelemetryProxyImage, telemetryProxyImageName) ctx = context.WithValue(ctx, internal.ContextTestAppJsClientImageName, testJsClientImageName) ctx = context.WithValue(ctx, internal.ContextTestAppJsServerImageName, testJsServerImageName) - ctx = context.WithValue(ctx, internal.ContextTestAppPythonImageName, testPythonImageName) testEnv = env.NewWithConfig(cfg).WithContext(ctx) @@ -219,7 +215,6 @@ func TestMain(m *testing.M) { internal.BuildDockerImageAndExportArchive(telemetryProxyImageName, filepath.Join(repoRoot, "telemetryproxy"), telemetryProxyImageArchivePath, logger), internal.BuildDockerImageAndExportArchive(testJsClientImageName, filepath.Join(cwd, "apps", "client"), testJsClientImageArchivePath, logger), internal.BuildDockerImageAndExportArchive(testJsServerImageName, filepath.Join(cwd, "apps", "server"), testJsServerImageArchivePath, logger), - internal.BuildDockerImageAndExportArchive(testPythonImageName, filepath.Join(cwd, "apps", "python"), testPythonImageArchivePath, logger), envfuncs.CreateKindClusterWithConfig(kindClusterName, kindNodeImageVal, kindConfigPath), @@ -227,8 +222,6 @@ func TestMain(m *testing.M) { internal.LoadDockerImageArchiveToCluster(kindClusterName, telemetryProxyImageArchivePath, logger), internal.LoadDockerImageArchiveToCluster(kindClusterName, testJsClientImageArchivePath, logger), internal.LoadDockerImageArchiveToCluster(kindClusterName, testJsServerImageArchivePath, logger), - internal.LoadDockerImageArchiveToCluster(kindClusterName, testPythonImageArchivePath, logger), - /* * Otel Collector image is on Docker hub, no need to pull it into Kind (pulling into Kind * works only for local image, in the local Docker daemon). diff --git a/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl b/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl index 2e88f9d..fa5aac3 100644 --- a/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl +++ b/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl @@ -6,10 +6,4 @@ nodes: - hostPath: '{{OTLP_SINK_CONFIG_VOLUME_PATH}}' containerPath: /lumigo/otlp-sink/config - hostPath: '{{OTLP_SINK_DATA_VOLUME_PATH}}' - containerPath: /lumigo/otlp-sink/data - kubeadmConfigPatches: - - | - kind: InitConfiguration - nodeRegistration: - kubeletExtraArgs: - system-reserved: memory=4Gi \ No newline at end of file + containerPath: /lumigo/otlp-sink/data \ No newline at end of file From cd318f4df16e41918750b4b3ddcf666bd077f465 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sat, 8 Jun 2024 21:32:23 +0300 Subject: [PATCH 25/30] Add a Python test-image with custom logging --- .../kubernetes-distros/kind/apps/python/Dockerfile | 9 +++++++++ tests/kubernetes-distros/kind/apps/python/app.py | 10 ++++++++++ .../kind/internal/build_docker_image.go | 1 + tests/kubernetes-distros/kind/internal/context.go | 1 + .../kind/lumigooperator_logs_test.go | 14 ++++++++++---- tests/kubernetes-distros/kind/main_test.go | 7 +++++++ .../kind/resources/kind-config.yaml.tpl | 8 +++++++- 7 files changed, 45 insertions(+), 5 deletions(-) create mode 100644 tests/kubernetes-distros/kind/apps/python/Dockerfile create mode 100644 tests/kubernetes-distros/kind/apps/python/app.py diff --git a/tests/kubernetes-distros/kind/apps/python/Dockerfile b/tests/kubernetes-distros/kind/apps/python/Dockerfile new file mode 100644 index 0000000..60008db --- /dev/null +++ b/tests/kubernetes-distros/kind/apps/python/Dockerfile @@ -0,0 +1,9 @@ +FROM python:3.9-slim + +WORKDIR /code + +COPY ./app.py /code/app.py + +LABEL distro-version='DEV' + +CMD ["python", "app.py", "something to say to the logs"] \ No newline at end of file diff --git a/tests/kubernetes-distros/kind/apps/python/app.py b/tests/kubernetes-distros/kind/apps/python/app.py new file mode 100644 index 0000000..4484a0f --- /dev/null +++ b/tests/kubernetes-distros/kind/apps/python/app.py @@ -0,0 +1,10 @@ +import sys +import time +import logging + +logger = logging.getLogger("test") +logger.setLevel(logging.DEBUG) + +while True: + logger.info(sys.argv[1]) + time.sleep(5) \ No newline at end of file diff --git a/tests/kubernetes-distros/kind/internal/build_docker_image.go b/tests/kubernetes-distros/kind/internal/build_docker_image.go index b62fc8c..da41c30 100644 --- a/tests/kubernetes-distros/kind/internal/build_docker_image.go +++ b/tests/kubernetes-distros/kind/internal/build_docker_image.go @@ -17,6 +17,7 @@ import ( const ( DEFAULT_JS_CLIENT_IMG_NAME = "host.docker.internal:5000/test-apps/js/client" DEFAULT_JS_SERVER_IMG_NAME = "host.docker.internal:5000/test-apps/js/server" + DEFAULT_PYTHON_IMG_NAME = "host.docker.internal:5000/test-apps/python-app" ) func BuildDockerImageAndExportArchive(imageName, sourceFolder, imageArchivePath string, logger *log.Logger) env.Func { diff --git a/tests/kubernetes-distros/kind/internal/context.go b/tests/kubernetes-distros/kind/internal/context.go index c4c21c1..447ef9c 100644 --- a/tests/kubernetes-distros/kind/internal/context.go +++ b/tests/kubernetes-distros/kind/internal/context.go @@ -15,6 +15,7 @@ var ( ContextKeySendDataToLumigo = ContextKey("lumigo/upstream/send_data") ContextTestAppJsClientImageName = ContextKey("test-apps/js/client/image/name") ContextTestAppJsServerImageName = ContextKey("test-apps/js/server/image/name") + ContextTestAppPythonImageName = ContextKey("test-apps/python/image/name") ) func (c ContextKey) String() string { diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index 8c4d9ec..280cc74 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -23,6 +23,7 @@ import ( appsv1 "k8s.io/api/apps/v1" corev1 "k8s.io/api/core/v1" + "k8s.io/apimachinery/pkg/api/resource" metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" "k8s.io/apimachinery/pkg/apis/meta/v1/unstructured" @@ -87,8 +88,6 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { r.Create(ctx, lumigo) deploymentName := "testdeployment" - testImage := "python" - logOutput := "IT'S ALIIIIIIVE!" tr := true var g int64 = 5678 @@ -124,8 +123,15 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { Containers: []corev1.Container{ { Name: "myapp", - Image: testImage, - Command: []string{"python", "-c", fmt.Sprintf("while True: print(\"%s\"); import time; time.sleep(5)", logOutput)}, + Image: ctx.Value(internal.ContextTestAppPythonImageName).(string), + Resources: corev1.ResourceRequirements{ + Limits: corev1.ResourceList{ + corev1.ResourceMemory: resource.MustParse("1Gi"), + }, + Requests: corev1.ResourceList{ + corev1.ResourceMemory: resource.MustParse("768Mi"), + }, + }, }, }, }, diff --git a/tests/kubernetes-distros/kind/main_test.go b/tests/kubernetes-distros/kind/main_test.go index f3eef20..6e63de8 100644 --- a/tests/kubernetes-distros/kind/main_test.go +++ b/tests/kubernetes-distros/kind/main_test.go @@ -191,6 +191,9 @@ func TestMain(m *testing.M) { testJsServerImageName := fmt.Sprintf("%s:%s", internal.DEFAULT_JS_SERVER_IMG_NAME, runId) testJsServerImageArchivePath := filepath.Join(tmpDir, "test-js-server.tgz") + testPythonImageName := fmt.Sprintf("%s:%s", internal.DEFAULT_PYTHON_IMG_NAME, runId) + testPythonImageArchivePath := filepath.Join(tmpDir, "test-python.tgz") + ctx := context.WithValue(context.Background(), internal.ContextKeyRunId, runId) ctx = context.WithValue(ctx, internal.ContextKeyKubernetesClusterName, kindClusterName) ctx = context.WithValue(ctx, internal.ContextKeyOtlpSinkConfigPath, dataSinkConfigDir) @@ -203,6 +206,7 @@ func TestMain(m *testing.M) { ctx = context.WithValue(ctx, internal.ContextKeyOperatorTelemetryProxyImage, telemetryProxyImageName) ctx = context.WithValue(ctx, internal.ContextTestAppJsClientImageName, testJsClientImageName) ctx = context.WithValue(ctx, internal.ContextTestAppJsServerImageName, testJsServerImageName) + ctx = context.WithValue(ctx, internal.ContextTestAppPythonImageName, testPythonImageName) testEnv = env.NewWithConfig(cfg).WithContext(ctx) @@ -215,6 +219,7 @@ func TestMain(m *testing.M) { internal.BuildDockerImageAndExportArchive(telemetryProxyImageName, filepath.Join(repoRoot, "telemetryproxy"), telemetryProxyImageArchivePath, logger), internal.BuildDockerImageAndExportArchive(testJsClientImageName, filepath.Join(cwd, "apps", "client"), testJsClientImageArchivePath, logger), internal.BuildDockerImageAndExportArchive(testJsServerImageName, filepath.Join(cwd, "apps", "server"), testJsServerImageArchivePath, logger), + internal.BuildDockerImageAndExportArchive(testPythonImageName, filepath.Join(cwd, "apps", "python"), testPythonImageArchivePath, logger), envfuncs.CreateKindClusterWithConfig(kindClusterName, kindNodeImageVal, kindConfigPath), @@ -222,6 +227,8 @@ func TestMain(m *testing.M) { internal.LoadDockerImageArchiveToCluster(kindClusterName, telemetryProxyImageArchivePath, logger), internal.LoadDockerImageArchiveToCluster(kindClusterName, testJsClientImageArchivePath, logger), internal.LoadDockerImageArchiveToCluster(kindClusterName, testJsServerImageArchivePath, logger), + internal.LoadDockerImageArchiveToCluster(kindClusterName, testPythonImageArchivePath, logger), + /* * Otel Collector image is on Docker hub, no need to pull it into Kind (pulling into Kind * works only for local image, in the local Docker daemon). diff --git a/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl b/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl index fa5aac3..2e88f9d 100644 --- a/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl +++ b/tests/kubernetes-distros/kind/resources/kind-config.yaml.tpl @@ -6,4 +6,10 @@ nodes: - hostPath: '{{OTLP_SINK_CONFIG_VOLUME_PATH}}' containerPath: /lumigo/otlp-sink/config - hostPath: '{{OTLP_SINK_DATA_VOLUME_PATH}}' - containerPath: /lumigo/otlp-sink/data \ No newline at end of file + containerPath: /lumigo/otlp-sink/data + kubeadmConfigPatches: + - | + kind: InitConfiguration + nodeRegistration: + kubeletExtraArgs: + system-reserved: memory=4Gi \ No newline at end of file From 022b0512cd7c9d5452fe94f81bfb2a5dd58bbae4 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sat, 8 Jun 2024 21:42:25 +0300 Subject: [PATCH 26/30] Failing test - waiting for injector update --- .../kind/lumigooperator_logs_test.go | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index 280cc74..733e2a8 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -358,6 +358,8 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { t.Fatalf("No log data found in '%s'", logsPath) } + foundApplicationLogs := false + /* * Logs come in multiple lines, and two different scopes; we need to split by '\n'. * bufio.NewScanner fails because our lines are "too long" (LOL). @@ -370,6 +372,11 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { l := exportRequest.Logs().ResourceLogs().Len() for i := 0; i < l; i++ { resourceLogs := exportRequest.Logs().ResourceLogs().At(i) + + if !strings.HasPrefix(resourceLogs.ScopeLogs().AppendEmpty().Scope().Name(), "lumigo-operator.") { + foundApplicationLogs = false + } + resourceAttributes := resourceLogs.Resource().Attributes().AsRaw() if actualClusterName, found := resourceAttributes["k8s.cluster.name"]; !found { @@ -386,6 +393,10 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { } } + if !foundApplicationLogs { + t.Fatalf("No application logs found in '%s'. \r\nMake sure the application has LUMIGO_ENABLE_LOGS=true and is emitting using a supported logger", logsPath) + } + return ctx }). Assess("Usage heartbeat is sent for instrumented namespaces", func(ctx context.Context, t *testing.T, c *envconf.Config) context.Context { From 27df8c6c6a4199ce1b0c773624818f1cf0814e9c Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 9 Jun 2024 08:20:39 +0300 Subject: [PATCH 27/30] Fix typo --- tests/kubernetes-distros/kind/lumigooperator_logs_test.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index 733e2a8..f35e80d 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -394,7 +394,7 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { } if !foundApplicationLogs { - t.Fatalf("No application logs found in '%s'. \r\nMake sure the application has LUMIGO_ENABLE_LOGS=true and is emitting using a supported logger", logsPath) + t.Fatalf("No application logs found in '%s'. \r\nMake sure the application has LUMIGO_ENABLE_LOGS=true and is emitting logs using a supported logger", logsPath) } return ctx From 6ca798783c51f389bfca7ff85209acc41f12baf7 Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 9 Jun 2024 11:52:20 +0300 Subject: [PATCH 28/30] Finalize Python logging setup --- .../kind/apps/python/app.py | 13 ++- .../kind/internal/lumigo.go | 5 +- .../kind/lumigooperator_logs_test.go | 97 +++++++++++++++---- .../kind/lumigooperator_traces_test.go | 2 +- 4 files changed, 93 insertions(+), 24 deletions(-) diff --git a/tests/kubernetes-distros/kind/apps/python/app.py b/tests/kubernetes-distros/kind/apps/python/app.py index 4484a0f..f26ef26 100644 --- a/tests/kubernetes-distros/kind/apps/python/app.py +++ b/tests/kubernetes-distros/kind/apps/python/app.py @@ -1,10 +1,17 @@ import sys import time import logging +from lumigo_opentelemetry import logger_provider logger = logging.getLogger("test") -logger.setLevel(logging.DEBUG) +logger.setLevel(logging.INFO) + +# Non-mandatory in our OTEL setup, but recommended for troubleshooting - adds a console handler to see the logs in the console +console_handler = logging.StreamHandler() +console_handler.setLevel(logging.INFO) +logger.addHandler(console_handler) while True: - logger.info(sys.argv[1]) - time.sleep(5) \ No newline at end of file + logger.info(sys.argv[1] if len(sys.argv) > 1 else "Hello, World!") + logger_provider.force_flush() + time.sleep(5) \ No newline at end of file diff --git a/tests/kubernetes-distros/kind/internal/lumigo.go b/tests/kubernetes-distros/kind/internal/lumigo.go index 71ef0b6..b9e4742 100644 --- a/tests/kubernetes-distros/kind/internal/lumigo.go +++ b/tests/kubernetes-distros/kind/internal/lumigo.go @@ -5,7 +5,7 @@ import ( metav1 "k8s.io/apimachinery/pkg/apis/meta/v1" ) -func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey string, injectionEnabled bool) *operatorv1alpha1.Lumigo { +func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey string, injectionEnabled bool, enableLogging bool) *operatorv1alpha1.Lumigo { return &operatorv1alpha1.Lumigo{ ObjectMeta: metav1.ObjectMeta{ Namespace: namespace, @@ -24,6 +24,9 @@ func NewLumigo(namespace, name, lumigoTokenSecretName, lumigoTokenSecretKey stri Enabled: &injectionEnabled, }, }, + Logging: operatorv1alpha1.LoggingSpec{ + Enabled: &enableLogging, + }, }, } } diff --git a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go index f35e80d..dfc6c73 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_logs_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_logs_test.go @@ -78,7 +78,7 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { t.Fatal(err) } - lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true) + lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true, true) r, err := resources.New(client.RESTConfig()) if err != nil { @@ -358,8 +358,6 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { t.Fatalf("No log data found in '%s'", logsPath) } - foundApplicationLogs := false - /* * Logs come in multiple lines, and two different scopes; we need to split by '\n'. * bufio.NewScanner fails because our lines are "too long" (LOL). @@ -372,11 +370,6 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { l := exportRequest.Logs().ResourceLogs().Len() for i := 0; i < l; i++ { resourceLogs := exportRequest.Logs().ResourceLogs().At(i) - - if !strings.HasPrefix(resourceLogs.ScopeLogs().AppendEmpty().Scope().Name(), "lumigo-operator.") { - foundApplicationLogs = false - } - resourceAttributes := resourceLogs.Resource().Attributes().AsRaw() if actualClusterName, found := resourceAttributes["k8s.cluster.name"]; !found { @@ -393,10 +386,6 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { } } - if !foundApplicationLogs { - t.Fatalf("No application logs found in '%s'. \r\nMake sure the application has LUMIGO_ENABLE_LOGS=true and is emitting logs using a supported logger", logsPath) - } - return ctx }). Assess("Usage heartbeat is sent for instrumented namespaces", func(ctx context.Context, t *testing.T, c *envconf.Config) context.Context { @@ -446,6 +435,52 @@ func TestLumigoOperatorEventsAndObjects(t *testing.T) { return ctx }). + Assess("Application logs are collected successfully and added k8s.* attributes", func(ctx context.Context, t *testing.T, c *envconf.Config) context.Context { + otlpSinkDataPath := ctx.Value(internal.ContextKeyOtlpSinkDataPath).(string) + logsPath := filepath.Join(otlpSinkDataPath, "logs.json") + + if err := apimachinerywait.PollImmediateUntilWithContext(ctx, time.Second*5, func(context.Context) (bool, error) { + logsBytes, err := os.ReadFile(logsPath) + if err != nil { + return false, err + } + + if len(logsBytes) < 1 { + return false, err + } + + applicationLogs := make([]plog.LogRecord, 0) + + /* + * Logs come in multiple lines, and two different scopes; we need to split by '\n'. + * bufio.NewScanner fails because our lines are "too long" (LOL). + */ + exportRequests := strings.Split(string(logsBytes), "\n") + for _, exportRequestJson := range exportRequests { + exportRequest := plogotlp.NewExportRequest() + exportRequest.UnmarshalJSON([]byte(exportRequestJson)) + + if appLogs, err := exportRequestToApplicationLogRecords(exportRequest); err != nil { + t.Fatalf("Cannot extract logs from export request: %v", err) + } else { + applicationLogs = append(applicationLogs, appLogs...) + } + } + + if len(applicationLogs) < 1 { + // No application logs received yet + t.Fatalf("No application logs found in '%s'. \r\nMake sure the application has LUMIGO_ENABLE_LOGS=true and is emitting logs using a supported logger", logsPath) + return false, nil + } + + t.Logf("Found application logs: %d", len(applicationLogs)) + return true, nil + }); err != nil { + t.Fatalf("Failed to wait for application logs: %v", err) + } + + return ctx + }). Feature() testEnv.Test(t, testAppDeploymentFeature) @@ -570,20 +605,44 @@ func exportRequestToHeartbeatLogRecords(exportRequest plogotlp.ExportRequest) ([ return eventLogs, nil } +func exportRequestToApplicationLogRecords(exportRequest plogotlp.ExportRequest) ([]plog.LogRecord, error) { + applicationLogs := make([]plog.LogRecord, 0) + logs := exportRequest.Logs() + + l := logs.ResourceLogs().Len() + for i := 0; i < l; i++ { + e, err := resourceLogsToApplicationLogRecords(logs.ResourceLogs().At(i)) + if err != nil { + return nil, err + } + + applicationLogs = append(applicationLogs, e...) + } + + return applicationLogs, nil +} + +func resourceLogsToApplicationLogRecords(resourceLogs plog.ResourceLogs) ([]plog.LogRecord, error) { + return resourceLogsToScopedLogRecords(resourceLogs, "opentelemetry.sdk._logs._internal") +} + func resourceLogsToHeartbeatLogRecords(resourceLogs plog.ResourceLogs) ([]plog.LogRecord, error) { + return resourceLogsToScopedLogRecords(resourceLogs, "lumigo-operator.namespace_heartbeat") +} + +func resourceLogsToScopedLogRecords(resourceLogs plog.ResourceLogs, filteredScopeName string) ([]plog.LogRecord, error) { l := resourceLogs.ScopeLogs().Len() - heartbeatLogRecords := make([]plog.LogRecord, 0) + filteredScopeLogRecords := make([]plog.LogRecord, 0) + for i := 0; i < l; i++ { scopeLogs := resourceLogs.ScopeLogs().At(i) scopeName := scopeLogs.Scope().Name() logRecords := scopeLogsToLogRecords(scopeLogs) - switch scopeName { - case "lumigo-operator.namespace_heartbeat": - { - heartbeatLogRecords = append(heartbeatLogRecords, logRecords...) - } + if scopeName == filteredScopeName { + filteredScopeLogRecords = append(filteredScopeLogRecords, logRecords...) } } - return heartbeatLogRecords, nil + + return filteredScopeLogRecords, nil } diff --git a/tests/kubernetes-distros/kind/lumigooperator_traces_test.go b/tests/kubernetes-distros/kind/lumigooperator_traces_test.go index 610915e..517e107 100644 --- a/tests/kubernetes-distros/kind/lumigooperator_traces_test.go +++ b/tests/kubernetes-distros/kind/lumigooperator_traces_test.go @@ -76,7 +76,7 @@ func TestLumigoOperatorTraces(t *testing.T) { t.Fatal(err) } - lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true) + lumigo := internal.NewLumigo(namespaceName, "lumigo", lumigoTokenName, lumigoTokenKey, true, false) r, err := resources.New(client.RESTConfig()) if err != nil { From 8da74ce4e6d84bf30aaffd37855c3dd31c8cb9fe Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 9 Jun 2024 16:37:57 +0300 Subject: [PATCH 29/30] Temp disable test-telemetry-proxy-for-security-issues --- .github/workflows/build-test-release.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-test-release.yml b/.github/workflows/build-test-release.yml index 5842288..a2803b2 100644 --- a/.github/workflows/build-test-release.yml +++ b/.github/workflows/build-test-release.yml @@ -342,7 +342,7 @@ jobs: - test-kustomize - test-kind - test-controller-for-security-issues - - test-telemetry-proxy-for-security-issues + # - test-telemetry-proxy-for-security-issues steps: - name: no-op run: echo '*tongue click* noice' @@ -596,7 +596,7 @@ jobs: run: | LUMIGO_AUTOTRACE_LATEST_VERSION=$(aws ecr describe-images --region us-east-1 --registry-id 709825985650 --repository-name lumigo/lumigo-autotrace --query 'sort_by(imageDetails,& imagePushedAt)[-2].imageTags[0]' --output text) echo "LUMIGO_AUTOTRACE_LATEST_VERSION=$LUMIGO_AUTOTRACE_LATEST_VERSION" - + yq e -i ".injectorWebhook.lumigoInjector.image.repository = \"${{ matrix.ecr-registry }}/lumigo/lumigo-autotrace\"" charts/lumigo-operator/values.yaml yq e -i ".injectorWebhook.lumigoInjector.image.tag = \"$LUMIGO_AUTOTRACE_LATEST_VERSION\"" charts/lumigo-operator/values.yaml yq e -i "(select(documentIndex == 1).spec.template.spec.containers[] | select(.name == \"manager\").env[] | select(.name == \"LUMIGO_INJECTOR_IMAGE\")).value = \"${{ matrix.ecr-registry }}/lumigo/lumigo-autotrace:$LUMIGO_AUTOTRACE_LATEST_VERSION\"" config/manager/manager.yaml From a7c9fbdba47018c9f0819f7979dbcc4f43f91f3f Mon Sep 17 00:00:00 2001 From: Harel Moshe Date: Sun, 9 Jun 2024 17:11:43 +0300 Subject: [PATCH 30/30] Revert "Temp disable test-telemetry-proxy-for-security-issues" This reverts commit 8da74ce4e6d84bf30aaffd37855c3dd31c8cb9fe. --- .github/workflows/build-test-release.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-test-release.yml b/.github/workflows/build-test-release.yml index a2803b2..5842288 100644 --- a/.github/workflows/build-test-release.yml +++ b/.github/workflows/build-test-release.yml @@ -342,7 +342,7 @@ jobs: - test-kustomize - test-kind - test-controller-for-security-issues - # - test-telemetry-proxy-for-security-issues + - test-telemetry-proxy-for-security-issues steps: - name: no-op run: echo '*tongue click* noice' @@ -596,7 +596,7 @@ jobs: run: | LUMIGO_AUTOTRACE_LATEST_VERSION=$(aws ecr describe-images --region us-east-1 --registry-id 709825985650 --repository-name lumigo/lumigo-autotrace --query 'sort_by(imageDetails,& imagePushedAt)[-2].imageTags[0]' --output text) echo "LUMIGO_AUTOTRACE_LATEST_VERSION=$LUMIGO_AUTOTRACE_LATEST_VERSION" - + yq e -i ".injectorWebhook.lumigoInjector.image.repository = \"${{ matrix.ecr-registry }}/lumigo/lumigo-autotrace\"" charts/lumigo-operator/values.yaml yq e -i ".injectorWebhook.lumigoInjector.image.tag = \"$LUMIGO_AUTOTRACE_LATEST_VERSION\"" charts/lumigo-operator/values.yaml yq e -i "(select(documentIndex == 1).spec.template.spec.containers[] | select(.name == \"manager\").env[] | select(.name == \"LUMIGO_INJECTOR_IMAGE\")).value = \"${{ matrix.ecr-registry }}/lumigo/lumigo-autotrace:$LUMIGO_AUTOTRACE_LATEST_VERSION\"" config/manager/manager.yaml