
WIP: initial EFK setup #610

Closed · wants to merge 7 commits
@@ -48,7 +48,8 @@
public class RestClientController {

private static Logger logger = LoggerFactory.getLogger(RestClientController.class.getName());



@Autowired
private PredictionService predictionService;

@@ -150,8 +151,8 @@ public ResponseEntity<String> predictions(RequestEntity<String> requestEntity)
try
{
SeldonMessage response = predictionService.predict(request);
String responseJson = ProtoBufUtils.toJson(response);
return new ResponseEntity<String>(responseJson, HttpStatus.OK);
}
catch (InterruptedException e) {
throw new APIException(ApiExceptionType.ENGINE_INTERRUPTED,e.getMessage());
@@ -18,13 +18,13 @@
import java.math.BigInteger;
import java.security.SecureRandom;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;

import io.seldon.engine.pb.ProtoBufUtils;
import org.apache.commons.lang3.StringUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.beans.factory.annotation.Value;
import org.springframework.stereotype.Service;

import com.google.protobuf.InvalidProtocolBufferException;
@@ -49,6 +49,16 @@ public class PredictionService {

PuidGenerator puidGenerator = new PuidGenerator();

@Value("${log.requests}")
private boolean logRequests;

@Value("${log.responses}")
private boolean logResponses;

@Value("${log.feedback.requests}")
private boolean logFeedbackRequests;


public final class PuidGenerator {
private SecureRandom random = new SecureRandom();

@@ -62,6 +72,10 @@ public void sendFeedback(Feedback feedback) throws InterruptedException, ExecutionException {
PredictorState predictorState = predictorBean.predictorStateFromPredictorSpec(enginePredictor.getPredictorSpec());

predictorBean.sendFeedback(feedback, predictorState);

if (logFeedbackRequests) {
logRawMessageAsJson(feedback);
}

return;
}
@@ -85,7 +99,33 @@ else if (StringUtils.isEmpty(request.getMeta().getPuid()))

SeldonMessage.Builder builder = SeldonMessage.newBuilder(predictorReturn).setMeta(Meta.newBuilder(predictorReturn.getMeta()).setPuid(puid));

SeldonMessage response = builder.build();

if (logRequests) {
    // log pure JSON now that the puid has been added
    logRawMessageAsJson(request);
}
if (logResponses) {
    logRawMessageAsJson(response);
}

return response;

}

private void logRawMessageAsJson(SeldonMessage message) {
    try {
        // Strip newlines so each JSON document occupies a single stdout line,
        // which line-oriented collectors such as fluentbit expect.
        System.out.println(ProtoBufUtils.toJson(message).replace("\n", "").replace("\r", ""));
    } catch (Exception ex) {
        logger.error("Unable to serialize message to JSON", ex);
    }
}

private void logRawMessageAsJson(Feedback message) {
    try {
        System.out.println(ProtoBufUtils.toJson(message).replace("\n", "").replace("\r", ""));
    } catch (Exception ex) {
        logger.error("Unable to serialize message to JSON", ex);
    }
}
}
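The `replace("\n", "")` / `replace("\r", "")` calls above matter because fluentbit treats each stdout line as a separate record; stripping newlines keeps every JSON document on one line. A minimal standalone sketch of the same pattern (plain strings instead of protobuf messages; class and method names here are illustrative, not part of the PR):

```java
public class SingleLineLogger {

    // Collapse a (possibly pretty-printed) JSON document onto one line so a
    // line-oriented collector such as fluentbit ingests it as a single record.
    static String toSingleLine(String json) {
        return json.replace("\n", "").replace("\r", "");
    }

    public static void main(String[] args) {
        String pretty = "{\n  \"data\": {\n    \"names\": [\"f0\"]\n  }\n}";
        // Prints the JSON collapsed onto a single line.
        System.out.println(toSingleLine(pretty));
    }
}
```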
6 changes: 5 additions & 1 deletion engine/src/main/resources/application.properties
@@ -14,4 +14,8 @@ spring.jmx.enabled = false

logging.file=
logging.level.root=WARN
logging.level.io.seldon=${SELDON_LOG_LEVEL:INFO}

log.requests=${SELDON_LOG_REQUESTS:true}
log.responses=${SELDON_LOG_RESPONSES:true}
log.feedback.requests=${SELDON_LOG_FEEDBACK_REQUESTS:true}
3 changes: 3 additions & 0 deletions engine/src/test/resources/application.properties
@@ -1,2 +1,5 @@
server.port = 8081

log.requests=${SELDON_LOG_REQUESTS:true}
log.responses=${SELDON_LOG_RESPONSES:true}
log.feedback.requests=${SELDON_LOG_FEEDBACK_REQUESTS:true}
102 changes: 102 additions & 0 deletions examples/centralised-logging/README.md
@@ -0,0 +1,102 @@
# Centralised Logging Example

## Introduction

Here we will set up EFK (Elasticsearch, Fluent Bit, Kibana) as a stack to gather logs from SeldonDeployments and make them searchable.

This demo targets minikube and is loosely based on https://www.katacoda.com/javajon/courses/kubernetes-observability/efk

Alternatives are available; if you are running in the cloud, consider a managed service from your provider.

## Setup

If helm is not already set up, it needs to be initialised (these commands assume Helm 2 with Tiller):

```
kubectl -n kube-system create sa tiller
kubectl create clusterrolebinding tiller --clusterrole cluster-admin --serviceaccount=kube-system:tiller
helm init --service-account tiller
```

First, add the Elastic helm repo:

```
helm repo add elastic https://helm.elastic.co
```

Next, install Elasticsearch with a minikube-sized configuration:

```
helm install --name elasticsearch elastic/elasticsearch --version 7.1.0 --namespace=logs -f elastic-minikube.yaml
```

Then install Fluent Bit as the log collection agent, pointing it at the Elasticsearch service:

```
helm install stable/fluent-bit --name=fluent-bit --namespace=logs --set backend.type=es --set backend.es.host=elasticsearch-master
```

And the Kibana UI, exposed as a NodePort so it is reachable from the host:

```
helm install elastic/kibana --version 7.1.0 --name=kibana --namespace=logs --set service.type=NodePort
```

## Generating Logging

First we need Seldon Core and a SeldonDeployment to generate logs.

Install the Seldon operator:

```
helm install seldon-core-operator --name seldon-core --namespace seldon-system --repo https://storage.googleapis.com/seldon-charts
```

Now deploy a model:

```
helm install seldon-single-model --name seldon-single-model --repo https://storage.googleapis.com/seldon-charts
```

And the load tester, to generate a steady stream of prediction requests:

```
kubectl label nodes $(kubectl get nodes -o jsonpath='{.items[0].metadata.name}') role=locust --overwrite
helm install seldon-core-loadtesting --name seldon-core-loadtesting --repo https://storage.googleapis.com/seldon-charts --set locust.host=http://seldon-single-model-seldon-single-model:8000 --set oauth.enabled=false --set oauth.key=oauth-key --set oauth.secret=oauth-secret --set locust.hatchRate=1 --set locust.clients=1 --set loadtest.sendFeedback=0 --set locust.minWait=0 --set locust.maxWait=0 --set replicaCount=1
```

## Inspecting Logging and Search for Requests

To find the Kibana URL:

```
echo $(minikube ip)":"$(kubectl get svc kibana-kibana -n logs -o=jsonpath='{.spec.ports[?(@.port==5601)].nodePort}')
```

When Kibana appears for the first time there will be a brief animation while it initializes.

1. On the Welcome page click `Explore on my own`.
2. From the top-left menu, or from the `Visualize and Explore Data` panel, select the `Discover` item.
3. In the `Index pattern` form field enter `kubernetes_cluster-*`.
4. It should read "Success!". Click the `> Next step` button on the right.
5. In the next form, select `timestamp` from the `Time Filter field name` dropdown.
6. From the bottom-right of the form select `Create index pattern`. In a moment a list of fields will appear.
7. From the top-left, or the home screen's `Visualize and Explore Data` panel, select the `Discover` item again. The log list will appear.
8. Refine the list a bit by selecting `log` near the bottom of the left-hand fields list: hover over or click the word `log`, then click the `Add` button that appears to the right of it.
9. You can create a filter using the `Add Filter` button under the search bar. The field can be `kubernetes.labels.seldon-app` and the value an `is` match on `seldon-single-model-seldon-single-model`.
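Equivalently, the same match can be typed straight into the Kibana search bar using KQL (the default query language in Kibana 7.x; field name and value as above):

```
kubernetes.labels.seldon-app : "seldon-single-model-seldon-single-model"
```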

The custom fields in the request bodies may not currently be in the index. If you hover over one in a request you may see `No cached mapping for this field`.

To add mappings, go to `Management` at the bottom-left and then `Index Patterns`. Hit `Refresh` on the index created earlier. The number of fields should increase and `data.names` should be present.

Now we can go back and add a further filter for `data.names` with the operator `exists`. We can add further filters if we want, such as the presence of a feature name or the presence of a feature value.

![picture](./kibana-custom-search.png)

## Notes

All pods will be logged. To exclude pods see https://docs.fluentbit.io/manual/filter/kubernetes#request-to-exclude-logs
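The exclusion mechanism in the linked docs works via a pod annotation: assuming the chart's Kubernetes filter has `K8S-Logging.Exclude` enabled, a pod annotated with `fluentbit.io/exclude` is skipped. A sketch with a hypothetical pod:

```
apiVersion: v1
kind: Pod
metadata:
  name: noisy-pod              # hypothetical pod whose logs we want to drop
  annotations:
    fluentbit.io/exclude: "true"
spec:
  containers:
  - name: app
    image: busybox
```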

In the future we may need to transform requests so that individual data points are searchable by position, since Elasticsearch cannot query arrays by index (see https://discuss.elastic.co/t/query-array-by-position/124765).
23 changes: 23 additions & 0 deletions examples/centralised-logging/elastic-minikube.yaml
@@ -0,0 +1,23 @@
---
# Permit co-located instances for solitary minikube virtual machines.
antiAffinity: "soft"

# Shrink default JVM heap.
esJavaOpts: "-Xmx128m -Xms128m"

# Allocate smaller chunks of memory per pod.
resources:
requests:
cpu: "100m"
memory: "512M"
limits:
cpu: "1000m"
memory: "512M"

# Request smaller persistent volumes.
volumeClaimTemplate:
accessModes: [ "ReadWriteOnce" ]
storageClassName: "standard"
resources:
requests:
storage: 100M