mirror of https://github.com/kubeflow/examples.git
Update serving in mnist example; use 0.4 and add testing. (#469)
* Add the TFServing component * Create TFServing components. * The model.py code doesn't appear to be exporting a model in saved model format; it was missing a call to export. * I'm not sure how this ever worked. * It also looks like there is a bug in the code in that it's using the CNN input fn even when the model is the linear one. I'm going to leave that as is for now. * Create a namespace for each test run; delete the namespace on teardown * We need to copy the GCP service account key to the new namespace. * Add a shell script to do that.
This commit is contained in:
parent
ef108dbbcc
commit
2494fdf8c5
|
|
@ -473,7 +473,74 @@ kubectl port-forward ${PODNAME} 6006:6006
|
||||||
|
|
||||||
Tensorboard can now be accessed at [http://127.0.0.1:6006](http://127.0.0.1:6006).
|
Tensorboard can now be accessed at [http://127.0.0.1:6006](http://127.0.0.1:6006).
|
||||||
|
|
||||||
## Using Tensorflow serving
|
## Serving the model
|
||||||
|
|
||||||
|
The model code will export the model in saved model format which is suitable for serving with TensorFlow serving.
|
||||||
|
|
||||||
|
To serve the model follow the instructions below. The instructions vary slightly based on where you are storing your
|
||||||
|
model (e.g. GCS, S3, PVC). Depending on the storage system we provide different ksonnet components as a convenience
|
||||||
|
for setting relevant environment variables.
|
||||||
|
|
||||||
|
|
||||||
|
### GCS
|
||||||
|
|
||||||
|
Here we show how to serve the model when it is stored on GCS. This assumes that when you trained the model you set `exportDir` to a GCS
|
||||||
|
URI; if not you can always copy it to GCS using `gsutil`.
|
||||||
|
|
||||||
|
Check that a model was exported
|
||||||
|
|
||||||
|
```
|
||||||
|
gsutil ls -r ${EXPORT_DIR}
|
||||||
|
|
||||||
|
```
|
||||||
|
|
||||||
|
The output should look something like
|
||||||
|
|
||||||
|
```
|
||||||
|
gs://${EXPORT_DIR}/1547100373/saved_model.pb
|
||||||
|
gs://${EXPORT_DIR}/1547100373/variables/:
|
||||||
|
gs://${EXPORT_DIR}/1547100373/variables/
|
||||||
|
gs://${EXPORT_DIR}/1547100373/variables/variables.data-00000-of-00001
|
||||||
|
gs://${EXPORT_DIR}/1547100373/variables/variables.index
|
||||||
|
```
|
||||||
|
|
||||||
|
The number `1547100373` is a version number auto-generated by TensorFlow; it will vary on each run but should be monotonically increasing if you save a model to the same location as a previous run.
|
||||||
|
|
||||||
|
|
||||||
|
Set your model path
|
||||||
|
|
||||||
|
```
|
||||||
|
ks param set ${ENV} mnist-deploy-gcp modelBasePath ${EXPORT_DIR}
|
||||||
|
|
||||||
|
```
|
||||||
|
|
||||||
|
Deploy it
|
||||||
|
|
||||||
|
```
|
||||||
|
ks param apply ${ENV} -c mnist-deploy-gcp
|
||||||
|
```
|
||||||
|
|
||||||
|
You can check the deployment by running
|
||||||
|
|
||||||
|
```
|
||||||
|
kubectl describe deployments mnist-deploy-gcp
|
||||||
|
```
|
||||||
|
|
||||||
|
### S3
|
||||||
|
|
||||||
|
TODO: Add instructions
|
||||||
|
|
||||||
|
### PVC
|
||||||
|
|
||||||
|
TODO: Add instructions
|
||||||
|
|
||||||
|
### Create the K8s service
|
||||||
|
|
||||||
|
Next we need to create a K8s service to route traffic to our model
|
||||||
|
|
||||||
|
```
|
||||||
|
ks apply jlewi -c mnist-service
|
||||||
|
```
|
||||||
|
|
||||||
By default the workflow deploys our model via Tensorflow Serving. Included in this example is a client that can query your model and provide results:
|
By default the workflow deploys our model via Tensorflow Serving. Included in this example is a client that can query your model and provide results:
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -2,14 +2,28 @@ apiVersion: 0.3.0
|
||||||
environments:
|
environments:
|
||||||
jlewi:
|
jlewi:
|
||||||
destination:
|
destination:
|
||||||
namespace: kubeflow
|
namespace: jlewi
|
||||||
server: https://35.196.210.94
|
server: https://35.196.210.94
|
||||||
k8sVersion: v1.11.5
|
k8sVersion: v1.11.5
|
||||||
path: jlewi
|
path: jlewi
|
||||||
|
test-env-d5e3:
|
||||||
|
destination:
|
||||||
|
namespace: jlewi
|
||||||
|
server: https://35.196.210.94
|
||||||
|
k8sVersion: v1.11.5
|
||||||
|
path: test-env-d5e3
|
||||||
kind: ksonnet.io/app
|
kind: ksonnet.io/app
|
||||||
|
libraries:
|
||||||
|
kubeflow/tf-serving:
|
||||||
|
name: tf-serving
|
||||||
|
registry: kubeflow
|
||||||
|
version: fed535eaa276220e4edf59530c0629f4375a40a9
|
||||||
name: ks_app
|
name: ks_app
|
||||||
registries:
|
registries:
|
||||||
incubator:
|
incubator:
|
||||||
protocol: github
|
protocol: github
|
||||||
uri: github.com/ksonnet/parts/tree/master/incubator
|
uri: github.com/ksonnet/parts/tree/master/incubator
|
||||||
|
kubeflow:
|
||||||
|
protocol: github
|
||||||
|
uri: github.com/kubeflow/kubeflow/tree/v0.4-branch/kubeflow
|
||||||
version: 0.0.1
|
version: 0.0.1
|
||||||
|
|
|
||||||
|
|
@ -0,0 +1,39 @@
|
||||||
|
local env = std.extVar("__ksonnet/environments");
|
||||||
|
local params = std.extVar("__ksonnet/params").components["mnist-deploy-aws"];
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
local deployment = k.apps.v1beta1.deployment;
|
||||||
|
local container = deployment.mixin.spec.template.spec.containersType;
|
||||||
|
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet";
|
||||||
|
local tfserving = import "kubeflow/tf-serving/tf-serving-template.libsonnet";
|
||||||
|
|
||||||
|
local base = tfserving.new(env, params);
|
||||||
|
local tfDeployment = base.tfDeployment +
|
||||||
|
deployment.mapContainers(
|
||||||
|
function(c) {
|
||||||
|
result::
|
||||||
|
c + container.withEnvMixin(
|
||||||
|
if util.toBool(params.s3Enable) then (
|
||||||
|
[
|
||||||
|
{
|
||||||
|
name: "AWS_ACCESS_KEY_ID",
|
||||||
|
valueFrom: { secretKeyRef: { name: params.s3SecretName, key: params.s3SecretAccesskeyidKeyName } },
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "AWS_SECRET_ACCESS_KEY",
|
||||||
|
valueFrom: { secretKeyRef: { name: params.s3SecretName, key: params.s3SecretSecretaccesskeyKeyName } },
|
||||||
|
},
|
||||||
|
{ name: "AWS_REGION", value: params.s3AwsRegion },
|
||||||
|
{ name: "S3_USE_HTTPS", value: std.toString(params.s3UseHttps) },
|
||||||
|
{ name: "S3_VERIFY_SSL", value: std.toString(params.s3VerifySsl) },
|
||||||
|
{ name: "S3_ENDPOINT", value: params.s3Endpoint },
|
||||||
|
]
|
||||||
|
) else [],
|
||||||
|
),
|
||||||
|
}.result,
|
||||||
|
);
|
||||||
|
util.list([
|
||||||
|
tfDeployment,
|
||||||
|
base.tfservingConfig,
|
||||||
|
],)
|
||||||
|
|
@ -0,0 +1,47 @@
|
||||||
|
local env = std.extVar("__ksonnet/environments");
|
||||||
|
local params = std.extVar("__ksonnet/params").components["mnist-deploy-gcp"];
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
local deployment = k.apps.v1beta1.deployment;
|
||||||
|
local container = deployment.mixin.spec.template.spec.containersType;
|
||||||
|
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet";
|
||||||
|
local tfserving = import "kubeflow/tf-serving/tf-serving-template.libsonnet";
|
||||||
|
|
||||||
|
local base = tfserving.new(env, params);
|
||||||
|
local tfDeployment = base.tfDeployment +
|
||||||
|
deployment.mixin.spec.template.spec.withVolumesMixin(
|
||||||
|
if params.gcpCredentialSecretName != "null" then (
|
||||||
|
[{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
secret: {
|
||||||
|
secretName: params.gcpCredentialSecretName,
|
||||||
|
},
|
||||||
|
}]
|
||||||
|
) else [],
|
||||||
|
) +
|
||||||
|
deployment.mapContainers(
|
||||||
|
function(c) {
|
||||||
|
result::
|
||||||
|
c + container.withEnvMixin(
|
||||||
|
if params.gcpCredentialSecretName != "null" then (
|
||||||
|
[{
|
||||||
|
name: "GOOGLE_APPLICATION_CREDENTIALS",
|
||||||
|
value: "/secret/gcp-credentials/user-gcp-sa.json",
|
||||||
|
}]
|
||||||
|
) else [],
|
||||||
|
) +
|
||||||
|
container.withVolumeMountsMixin(
|
||||||
|
if params.gcpCredentialSecretName != "null" then (
|
||||||
|
[{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
mountPath: "/secret/gcp-credentials",
|
||||||
|
}]
|
||||||
|
) else [],
|
||||||
|
),
|
||||||
|
}.result,
|
||||||
|
);
|
||||||
|
util.list([
|
||||||
|
tfDeployment,
|
||||||
|
base.tfservingConfig,
|
||||||
|
],)
|
||||||
|
|
@ -0,0 +1,8 @@
|
||||||
|
local env = std.extVar("__ksonnet/environments");
|
||||||
|
local params = std.extVar("__ksonnet/params").components["mnist-service"];
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
local tfservingService = import "kubeflow/tf-serving/tf-serving-service-template.libsonnet";
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet";
|
||||||
|
|
||||||
|
tfservingService.new(env, params).all
|
||||||
|
|
@ -4,15 +4,58 @@
|
||||||
train: {
|
train: {
|
||||||
batchSize: 100,
|
batchSize: 100,
|
||||||
envVariables: 'GOOGLE_APPLICATION_CREDENTIALS=/var/secrets/user-gcp-sa.json',
|
envVariables: 'GOOGLE_APPLICATION_CREDENTIALS=/var/secrets/user-gcp-sa.json',
|
||||||
exportDir: 'gs://kubeflow-ci_temp/mnist-jlewi',
|
exportDir: 'gs://kubeflow-ci_temp/mnist-jlewi/export',
|
||||||
image: 'gcr.io/kubeflow-examples/mnist/model:v20190108-v0.2-137-g38daafa-dirty-911944',
|
image: 'gcr.io/kubeflow-examples/mnist/model:v20190111-v0.2-148-g313770f',
|
||||||
learningRate: '0.01',
|
learningRate: '0.01',
|
||||||
modelDir: 'gs://kubeflow-ci_temp/mnist-jlewi',
|
modelDir: 'gs://kubeflow-ci_temp/mnist-jlewi',
|
||||||
name: 'mnist-train',
|
name: 'mnist-train',
|
||||||
numPs: 1,
|
numPs: 0,
|
||||||
numWorkers: 2,
|
numWorkers: 0,
|
||||||
secret: '',
|
secret: '',
|
||||||
trainSteps: 200,
|
trainSteps: 200,
|
||||||
},
|
},
|
||||||
|
"mnist-deploy-gcp": {
|
||||||
|
defaultCpuImage: 'tensorflow/serving:1.11.1',
|
||||||
|
defaultGpuImage: 'tensorflow/serving:1.11.1-gpu',
|
||||||
|
deployHttpProxy: 'false',
|
||||||
|
enablePrometheus: 'true',
|
||||||
|
gcpCredentialSecretName: 'user-gcp-sa',
|
||||||
|
httpProxyImage: '',
|
||||||
|
injectIstio: 'false',
|
||||||
|
modelBasePath: 'gs://kubeflow-examples-data/mnist',
|
||||||
|
modelName: 'mnist',
|
||||||
|
name: 'mnist-deploy-gcp',
|
||||||
|
numGpus: '0',
|
||||||
|
versionName: 'v1',
|
||||||
|
},
|
||||||
|
"mnist-deploy-aws": {
|
||||||
|
defaultCpuImage: 'tensorflow/serving:1.11.1',
|
||||||
|
defaultGpuImage: 'tensorflow/serving:1.11.1-gpu',
|
||||||
|
deployHttpProxy: 'false',
|
||||||
|
enablePrometheus: 'true',
|
||||||
|
httpProxyImage: 'gcr.io/kubeflow-images-public/tf-model-server-http-proxy:v20180723',
|
||||||
|
injectIstio: 'false',
|
||||||
|
modelBasePath: 's3://kubeflow-examples-data/mnist',
|
||||||
|
modelName: 'null',
|
||||||
|
name: 'mnist-deploy-aws',
|
||||||
|
numGpus: '0',
|
||||||
|
s3AwsRegion: 'us-west-1',
|
||||||
|
s3Enable: 'false',
|
||||||
|
s3Endpoint: 's3.us-west-1.amazonaws.com',
|
||||||
|
s3SecretAccesskeyidKeyName: 'AWS_ACCESS_KEY_ID',
|
||||||
|
s3SecretName: 'null',
|
||||||
|
s3SecretSecretaccesskeyKeyName: 'AWS_SECRET_ACCESS_KEY',
|
||||||
|
s3UseHttps: 'true',
|
||||||
|
s3VerifySsl: 'true',
|
||||||
|
versionName: 'v1',
|
||||||
|
},
|
||||||
|
"mnist-service": {
|
||||||
|
enablePrometheus: 'true',
|
||||||
|
injectIstio: 'false',
|
||||||
|
modelName: 'null',
|
||||||
|
name: 'mnist-service',
|
||||||
|
serviceType: 'ClusterIP',
|
||||||
|
trafficRule: 'v1:100',
|
||||||
|
},
|
||||||
},
|
},
|
||||||
}
|
}
|
||||||
|
|
@ -43,8 +43,9 @@ local trainEnv = [
|
||||||
},
|
},
|
||||||
];
|
];
|
||||||
|
|
||||||
local secretName = std.split(params.secret, "=")[0];
|
local secretPieces = std.split(params.secret, "=");
|
||||||
local secretMountPath = std.split(params.secret, "=")[1];
|
local secretName = if std.length(secretPieces) > 0 then secretPieces[0] else "";
|
||||||
|
local secretMountPath = if std.length(secretPieces) > 1 then secretPieces[1] else "";
|
||||||
|
|
||||||
local replicaSpec = {
|
local replicaSpec = {
|
||||||
containers: [
|
containers: [
|
||||||
|
|
|
||||||
|
|
@ -8,6 +8,23 @@ local envParams = params + {
|
||||||
train+: {
|
train+: {
|
||||||
name: 'mnist-train-dist',
|
name: 'mnist-train-dist',
|
||||||
secret: 'user-gcp-sa=/var/secrets',
|
secret: 'user-gcp-sa=/var/secrets',
|
||||||
|
numSteps: 10,
|
||||||
|
image: 'gcr.io/kubeflow-examples/mnist/model:v20190111-v0.2-146-g0bbff62-dirty-12f353',
|
||||||
|
numWorkers: 2,
|
||||||
|
numPs: 1,
|
||||||
|
},
|
||||||
|
"deploy-gcp"+: {
|
||||||
|
modelBasePath: 'gs://kubeflow-ci_temp/mnist-jlewi/export',
|
||||||
|
},
|
||||||
|
"mnist-deploy-gcp"+: {
|
||||||
|
modelBasePath: 'gs://kubeflow-ci_temp/mnist-jlewi/export',
|
||||||
|
name: 'jlewi-deploy-test',
|
||||||
|
namespace: 'jlewi',
|
||||||
|
},
|
||||||
|
"mnist-service"+: {
|
||||||
|
name: 'jlewi-deploy-test',
|
||||||
|
namespace: 'jlewi',
|
||||||
|
modelBasePath: 'gs://kubeflow-ci_temp/mnist-jlewi/export',
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
};
|
};
|
||||||
|
|
|
||||||
|
|
@ -0,0 +1,2 @@
|
||||||
|
{
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,9 @@
|
||||||
|
local base = import "base.libsonnet";
|
||||||
|
// uncomment if you reference ksonnet-lib
|
||||||
|
// local k = import "k.libsonnet";
|
||||||
|
// local deployment = k.apps.v1beta2.deployment;
|
||||||
|
|
||||||
|
base + {
|
||||||
|
// Insert user-specified overrides here. For example if a component is named \"nginx-deployment\", you might have something like:\n")
|
||||||
|
// "nginx-deployment"+: deployment.mixin.metadata.withLabels({foo: "bar"})
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,28 @@
|
||||||
|
local params = std.extVar('__ksonnet/params');
|
||||||
|
local globals = import 'globals.libsonnet';
|
||||||
|
local envParams = params + {
|
||||||
|
components+: {
|
||||||
|
train+: {
|
||||||
|
name: 'jlewi-deploy-test',
|
||||||
|
namespace: 'jlewi',
|
||||||
|
modelBasePath: 'gs://kubeflow-ci_temp/mnist-jlewi/export',
|
||||||
|
},
|
||||||
|
"mnist-deploy-gcp"+: {
|
||||||
|
name: 'jlewi-deploy-test',
|
||||||
|
namespace: 'jlewi',
|
||||||
|
modelBasePath: 'gs://kubeflow-ci_temp/mnist-jlewi/export',
|
||||||
|
},
|
||||||
|
"mnist-service"+: {
|
||||||
|
name: 'jlewi-deploy-test',
|
||||||
|
namespace: 'jlewi',
|
||||||
|
modelBasePath: 'gs://kubeflow-ci_temp/mnist-jlewi/export',
|
||||||
|
},
|
||||||
|
},
|
||||||
|
};
|
||||||
|
|
||||||
|
{
|
||||||
|
components: {
|
||||||
|
[x]: envParams.components[x] + globals
|
||||||
|
for x in std.objectFields(envParams.components)
|
||||||
|
},
|
||||||
|
}
|
||||||
73
mnist/ks_app/vendor/kubeflow/tf-serving@fed535eaa276220e4edf59530c0629f4375a40a9/README.md
vendored
Normal file
73
mnist/ks_app/vendor/kubeflow/tf-serving@fed535eaa276220e4edf59530c0629f4375a40a9/README.md
vendored
Normal file
|
|
@ -0,0 +1,73 @@
|
||||||
|
<!-- START doctoc generated TOC please keep comment here to allow auto update -->
|
||||||
|
<!-- DON'T EDIT THIS SECTION, INSTEAD RE-RUN doctoc TO UPDATE -->
|
||||||
|
**Table of Contents** *generated with [DocToc](https://github.com/thlorenz/doctoc)*
|
||||||
|
|
||||||
|
- [tf-serving](#tf-serving)
|
||||||
|
- [Quickstart](#quickstart)
|
||||||
|
- [Using the library](#using-the-library)
|
||||||
|
- [io.ksonnet.pkg.tf-serving](#ioksonnetpkgtf-serving)
|
||||||
|
- [Example](#example)
|
||||||
|
- [Parameters](#parameters)
|
||||||
|
|
||||||
|
<!-- END doctoc generated TOC please keep comment here to allow auto update -->
|
||||||
|
|
||||||
|
# tf-serving
|
||||||
|
|
||||||
|
> TensorFlow serving is a server for TensorFlow models.
|
||||||
|
|
||||||
|
|
||||||
|
* [Quickstart](#quickstart)
|
||||||
|
* [Using Prototypes](#using-prototypes)
|
||||||
|
* [io.ksonnet.pkg.tf-serving](#io.ksonnet.pkg.tf-serving)
|
||||||
|
|
||||||
|
## Quickstart
|
||||||
|
|
||||||
|
*The following commands use the `io.ksonnet.pkg.tf-serving` prototype to generate Kubernetes YAML for tf-serving, and then deploys it to your Kubernetes cluster.*
|
||||||
|
|
||||||
|
First, create a cluster and install the ksonnet CLI (see root-level [README.md](rootReadme)).
|
||||||
|
|
||||||
|
If you haven't yet created a [ksonnet application](linkToSomewhere), do so using `ks init <app-name>`.
|
||||||
|
|
||||||
|
Finally, in the ksonnet application directory, run the following:
|
||||||
|
|
||||||
|
```shell
|
||||||
|
# Expand prototype as a Jsonnet file, place in a file in the
|
||||||
|
# `components/` directory. (YAML and JSON are also available.)
|
||||||
|
$ ks prototype use io.ksonnet.pkg.tf-serving tf-serving \
|
||||||
|
--name tf-serving \
|
||||||
|
--namespace default
|
||||||
|
|
||||||
|
# Apply to server.
|
||||||
|
$ ks apply -f tf-serving.jsonnet
|
||||||
|
```
|
||||||
|
|
||||||
|
## Using the library
|
||||||
|
|
||||||
|
The library files for tf-serving define a set of relevant *parts* (_e.g._, deployments, services, secrets, and so on) that can be combined to configure tf-serving for a wide variety of scenarios. For example, a database like Redis may need a secret to hold the user password, or it may have no password if it's acting as a cache.
|
||||||
|
|
||||||
|
This library provides a set of pre-fabricated "flavors" (or "distributions") of tf-serving, each of which is configured for a different use case. These are captured as ksonnet *prototypes*, which allow users to interactively customize these distributions for their specific needs.
|
||||||
|
|
||||||
|
These prototypes, as well as how to use them, are enumerated below.
|
||||||
|
|
||||||
|
### io.ksonnet.pkg.tf-serving
|
||||||
|
|
||||||
|
TensorFlow serving
|
||||||
|
#### Example
|
||||||
|
|
||||||
|
```shell
|
||||||
|
# Expand prototype as a Jsonnet file, place in a file in the
|
||||||
|
# `components/` directory. (YAML and JSON are also available.)
|
||||||
|
$ ks prototype use io.ksonnet.pkg.tf-serving tf-serving \
|
||||||
|
--name YOUR_NAME_HERE \
|
||||||
|
--model_path YOUR_MODEL_PATH_HERE
|
||||||
|
```
|
||||||
|
|
||||||
|
#### Parameters
|
||||||
|
|
||||||
|
The available options to pass prototype are:
|
||||||
|
|
||||||
|
* `--name=<name>`: Name to give to each of the components [string]
|
||||||
|
* `--model_path=<model_path>`: Path to the model. This can be a GCS path. [string]
|
||||||
|
|
||||||
|
|
||||||
|
[rootReadme]: https://github.com/ksonnet/mixins
|
||||||
35
mnist/ks_app/vendor/kubeflow/tf-serving@fed535eaa276220e4edf59530c0629f4375a40a9/parts.yaml
vendored
Normal file
35
mnist/ks_app/vendor/kubeflow/tf-serving@fed535eaa276220e4edf59530c0629f4375a40a9/parts.yaml
vendored
Normal file
|
|
@ -0,0 +1,35 @@
|
||||||
|
{
|
||||||
|
"name": "tf-serving",
|
||||||
|
"apiVersion": "0.0.1",
|
||||||
|
"kind": "ksonnet.io/parts",
|
||||||
|
"description": "TensorFlow serving is a server for TensorFlow models.\n",
|
||||||
|
"author": "kubeflow team <kubeflow-team@google.com>",
|
||||||
|
"contributors": [
|
||||||
|
{
|
||||||
|
"name": "Jeremy Lewi",
|
||||||
|
"email": "jlewi@google.com"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"repository": {
|
||||||
|
"type": "git",
|
||||||
|
"url": "https://github.com/kubeflow/kubeflow"
|
||||||
|
},
|
||||||
|
"bugs": {
|
||||||
|
"url": "https://github.com/kubeflow/kubeflow/issues"
|
||||||
|
},
|
||||||
|
"keywords": [
|
||||||
|
"kubeflow",
|
||||||
|
"tensorflow",
|
||||||
|
"database"
|
||||||
|
],
|
||||||
|
"quickStart": {
|
||||||
|
"prototype": "io.ksonnet.pkg.tf-serving",
|
||||||
|
"componentName": "tf-serving",
|
||||||
|
"flags": {
|
||||||
|
"name": "tf-serving",
|
||||||
|
"namespace": "default"
|
||||||
|
},
|
||||||
|
"comment": "Run TensorFlow Serving"
|
||||||
|
},
|
||||||
|
"license": "Apache 2.0"
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,23 @@
|
||||||
|
// @apiVersion 0.1
|
||||||
|
// @name io.ksonnet.pkg.tf-serving
|
||||||
|
// @description TensorFlow serving
|
||||||
|
// @shortDescription A TensorFlow serving deployment
|
||||||
|
// @param name string Name to give to each of the components
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
|
||||||
|
// ksonnet appears to require name be a parameter of the prototype which is why we handle it differently.
|
||||||
|
local name = import "param://name";
|
||||||
|
|
||||||
|
// updatedParams includes the namespace from env by default.
|
||||||
|
local updatedParams = params + env;
|
||||||
|
|
||||||
|
local tfServingBase = import "kubeflow/tf-serving/tf-serving.libsonnet";
|
||||||
|
local tfServing = tfServingBase {
|
||||||
|
// Override parameters with user supplied parameters.
|
||||||
|
params+: updatedParams {
|
||||||
|
name: name,
|
||||||
|
},
|
||||||
|
};
|
||||||
|
|
||||||
|
std.prune(k.core.v1.list.new(tfServing.components))
|
||||||
|
|
@ -0,0 +1,61 @@
|
||||||
|
// @apiVersion 0.1
|
||||||
|
// @name io.ksonnet.pkg.tf-serving-deployment-aws
|
||||||
|
// @description TensorFlow serving
|
||||||
|
// @shortDescription A TensorFlow serving deployment
|
||||||
|
// @param name string Name to give to each of the components
|
||||||
|
// @optionalParam numGpus string 0 Number of gpus to use
|
||||||
|
// @optionalParam deployHttpProxy string false Whether to deploy http proxy
|
||||||
|
// @optionalParam injectIstio string false Whether to inject istio sidecar; should be true or false.
|
||||||
|
// @optionalParam enablePrometheus string true Whether to enable prometheus endpoint (requires TF 1.11)
|
||||||
|
// @optionalParam modelBasePath string s3://kubeflow-examples-data/mnist The model path
|
||||||
|
// @optionalParam modelName string null The model name
|
||||||
|
// @optionalParam versionName string v1 The version name
|
||||||
|
// @optionalParam defaultCpuImage string tensorflow/serving:1.11.1 The default model server image (cpu)
|
||||||
|
// @optionalParam defaultGpuImage string tensorflow/serving:1.11.1-gpu The default model server image (gpu)
|
||||||
|
// @optionalParam httpProxyImage string gcr.io/kubeflow-images-public/tf-model-server-http-proxy:v20180723 Http proxy image
|
||||||
|
// @optionalParam s3Enable string false Whether to enable S3
|
||||||
|
// Following parameters are needed only if s3Enable is true
|
||||||
|
// @optionalParam s3SecretName string null Name of the k8s secrets containing S3 credentials
|
||||||
|
// @optionalParam s3SecretAccesskeyidKeyName string AWS_ACCESS_KEY_ID Name of the key in the k8s secret containing AWS_ACCESS_KEY_ID
|
||||||
|
// @optionalParam s3SecretSecretaccesskeyKeyName string AWS_SECRET_ACCESS_KEY Name of the key in the k8s secret containing AWS_SECRET_ACCESS_KEY
|
||||||
|
// @optionalParam s3AwsRegion string us-west-1 S3 region
|
||||||
|
// @optionalParam s3UseHttps string true Whether or not to use https
|
||||||
|
// @optionalParam s3VerifySsl string true Whether or not to verify https certificates for S3 connections
|
||||||
|
// @optionalParam s3Endpoint string s3.us-west-1.amazonaws.com URL for your s3-compatible endpoint
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
local deployment = k.apps.v1beta1.deployment;
|
||||||
|
local container = deployment.mixin.spec.template.spec.containersType;
|
||||||
|
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet";
|
||||||
|
local tfserving = import "kubeflow/tf-serving/tf-serving-template.libsonnet";
|
||||||
|
|
||||||
|
local base = tfserving.new(env, params);
|
||||||
|
local tfDeployment = base.tfDeployment +
|
||||||
|
deployment.mapContainers(
|
||||||
|
function(c) {
|
||||||
|
result::
|
||||||
|
c + container.withEnvMixin(
|
||||||
|
if util.toBool(params.s3Enable) then (
|
||||||
|
[
|
||||||
|
{
|
||||||
|
name: "AWS_ACCESS_KEY_ID",
|
||||||
|
valueFrom: { secretKeyRef: { name: params.s3SecretName, key: params.s3SecretAccesskeyidKeyName } },
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "AWS_SECRET_ACCESS_KEY",
|
||||||
|
valueFrom: { secretKeyRef: { name: params.s3SecretName, key: params.s3SecretSecretaccesskeyKeyName } },
|
||||||
|
},
|
||||||
|
{ name: "AWS_REGION", value: params.s3AwsRegion },
|
||||||
|
{ name: "S3_USE_HTTPS", value: std.toString(params.s3UseHttps) },
|
||||||
|
{ name: "S3_VERIFY_SSL", value: std.toString(params.s3VerifySsl) },
|
||||||
|
{ name: "S3_ENDPOINT", value: params.s3Endpoint },
|
||||||
|
]
|
||||||
|
) else [],
|
||||||
|
),
|
||||||
|
}.result,
|
||||||
|
);
|
||||||
|
util.list([
|
||||||
|
tfDeployment,
|
||||||
|
base.tfservingConfig,
|
||||||
|
],)
|
||||||
|
|
@ -0,0 +1,61 @@
|
||||||
|
// @apiVersion 0.1
|
||||||
|
// @name io.ksonnet.pkg.tf-serving-deployment-gcp
|
||||||
|
// @description TensorFlow serving
|
||||||
|
// @shortDescription A TensorFlow serving deployment
|
||||||
|
// @param name string Name to give to each of the components
|
||||||
|
// @optionalParam numGpus string 0 Number of gpus to use
|
||||||
|
// @optionalParam deployHttpProxy string false Whether to deploy http proxy
|
||||||
|
// @optionalParam modelBasePath string gs://kubeflow-examples-data/mnist The model path
|
||||||
|
// @optionalParam modelName string null The model name
|
||||||
|
// @optionalParam versionName string v1 The version name
|
||||||
|
// @optionalParam defaultCpuImage string tensorflow/serving:1.11.1 The default model server image (cpu)
|
||||||
|
// @optionalParam defaultGpuImage string tensorflow/serving:1.11.1-gpu The default model server image (gpu)
|
||||||
|
// @optionalParam httpProxyImage string gcr.io/kubeflow-images-public/tf-model-server-http-proxy:v20180723 Http proxy image
|
||||||
|
// @optionalParam gcpCredentialSecretName string null If not empty, insert the secret credential
|
||||||
|
// @optionalParam injectIstio string false Whether to inject istio sidecar; should be true or false.
|
||||||
|
// @optionalParam enablePrometheus string true Whether to enable prometheus endpoint (requires TF 1.11)
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
local deployment = k.apps.v1beta1.deployment;
|
||||||
|
local container = deployment.mixin.spec.template.spec.containersType;
|
||||||
|
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet";
|
||||||
|
local tfserving = import "kubeflow/tf-serving/tf-serving-template.libsonnet";
|
||||||
|
|
||||||
|
local base = tfserving.new(env, params);
|
||||||
|
local tfDeployment = base.tfDeployment +
|
||||||
|
deployment.mixin.spec.template.spec.withVolumesMixin(
|
||||||
|
if params.gcpCredentialSecretName != "null" then (
|
||||||
|
[{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
secret: {
|
||||||
|
secretName: params.gcpCredentialSecretName,
|
||||||
|
},
|
||||||
|
}]
|
||||||
|
) else [],
|
||||||
|
) +
|
||||||
|
deployment.mapContainers(
|
||||||
|
function(c) {
|
||||||
|
result::
|
||||||
|
c + container.withEnvMixin(
|
||||||
|
if params.gcpCredentialSecretName != "null" then (
|
||||||
|
[{
|
||||||
|
name: "GOOGLE_APPLICATION_CREDENTIALS",
|
||||||
|
value: "/secret/gcp-credentials/user-gcp-sa.json",
|
||||||
|
}]
|
||||||
|
) else [],
|
||||||
|
) +
|
||||||
|
container.withVolumeMountsMixin(
|
||||||
|
if params.gcpCredentialSecretName != "null" then (
|
||||||
|
[{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
mountPath: "/secret/gcp-credentials",
|
||||||
|
}]
|
||||||
|
) else [],
|
||||||
|
),
|
||||||
|
}.result,
|
||||||
|
);
|
||||||
|
util.list([
|
||||||
|
tfDeployment,
|
||||||
|
base.tfservingConfig,
|
||||||
|
],)
|
||||||
|
|
@ -0,0 +1,16 @@
|
||||||
|
// @apiVersion 0.1
|
||||||
|
// @name io.ksonnet.pkg.tf-serving-service
|
||||||
|
// @description TensorFlow serving
|
||||||
|
// @shortDescription A TensorFlow serving model
|
||||||
|
// @param name string Name to give to each of the components
|
||||||
|
// @optionalParam serviceType string ClusterIP The k8s service type for tf serving.
|
||||||
|
// @optionalParam modelName string null The model name
|
||||||
|
// @optionalParam trafficRule string v1:100 The traffic rule, in the format of version:percentage,version:percentage,..
|
||||||
|
// @optionalParam injectIstio string false Whether to inject istio sidecar; should be true or false.
|
||||||
|
// @optionalParam enablePrometheus string true Whether to enable prometheus endpoint (requires TF 1.11)
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
local tfservingService = import "kubeflow/tf-serving/tf-serving-service-template.libsonnet";
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet";
|
||||||
|
|
||||||
|
tfservingService.new(env, params).all
|
||||||
|
|
@ -0,0 +1,230 @@
|
||||||
|
// @apiVersion 0.1
|
||||||
|
// @name io.ksonnet.pkg.tf-serving-request-log
|
||||||
|
// @description tf-serving with request logging
|
||||||
|
// @shortDescription tf-serving with request logging
|
||||||
|
// @param name string Name to give to each of the components
|
||||||
|
// @param gcpProject string The gcp project for Bigquery dataset
|
||||||
|
// @param dataset string The Bigquery dataset
|
||||||
|
// @param table string The Bigquery table
|
||||||
|
// @optionalParam modelBasePath string gs://kubeflow-examples-data/mnist The model path
|
||||||
|
// @optionalParam modelName string mnist The model name
|
||||||
|
|
||||||
|
local k = import "k.libsonnet";
|
||||||
|
|
||||||
|
local namespace = "kubeflow";
|
||||||
|
local appName = import "param://name";
|
||||||
|
local image = "gcr.io/kubeflow-images-public/tf-model-server-cpu:v20180327-995786ec";
|
||||||
|
local httpProxyImage = "gcr.io/kubeflow-images-public/tf-model-server-http-proxy:v20180723";
|
||||||
|
local loggingImage = "gcr.io/kubeflow-images-public/tf-model-server-request-logger:v20180723";
|
||||||
|
|
||||||
|
local gcpSecretName = "user-gcp-sa";
|
||||||
|
|
||||||
|
local service = {
|
||||||
|
apiVersion: "v1",
|
||||||
|
kind: "Service",
|
||||||
|
metadata: {
|
||||||
|
labels: {
|
||||||
|
app: appName,
|
||||||
|
},
|
||||||
|
name: appName,
|
||||||
|
namespace: namespace,
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
name: "grpc-tf-serving",
|
||||||
|
port: 9000,
|
||||||
|
targetPort: 9000,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "http-tf-serving-proxy",
|
||||||
|
port: 8000,
|
||||||
|
targetPort: 8000,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
selector: {
|
||||||
|
app: appName,
|
||||||
|
},
|
||||||
|
type: "ClusterIP",
|
||||||
|
},
|
||||||
|
};
|
||||||
|
|
||||||
|
local configMap = {
|
||||||
|
apiVersion: "v1",
|
||||||
|
kind: "ConfigMap",
|
||||||
|
metadata: {
|
||||||
|
name: appName + "fluentd-config",
|
||||||
|
namespace: namespace,
|
||||||
|
},
|
||||||
|
data: {
|
||||||
|
"fluent.conf": std.format(|||
|
||||||
|
<source>
|
||||||
|
@type tail
|
||||||
|
path /tmp/logs/request.log
|
||||||
|
pos_file /tmp/logs/request.log.pos
|
||||||
|
<parse>
|
||||||
|
@type json
|
||||||
|
</parse>
|
||||||
|
tag dummy
|
||||||
|
</source>
|
||||||
|
<match dummy>
|
||||||
|
@type bigquery_insert
|
||||||
|
auth_method application_default
|
||||||
|
project %s
|
||||||
|
dataset %s
|
||||||
|
table %s
|
||||||
|
fetch_schema true
|
||||||
|
</match>
|
||||||
|
|||, [params.gcpProject, params.dataset, params.table]),
|
||||||
|
},
|
||||||
|
};
|
||||||
|
|
||||||
|
local deployment = {
|
||||||
|
apiVersion: "extensions/v1beta1",
|
||||||
|
kind: "Deployment",
|
||||||
|
metadata: {
|
||||||
|
labels: {
|
||||||
|
app: appName,
|
||||||
|
},
|
||||||
|
name: appName,
|
||||||
|
namespace: namespace,
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
template: {
|
||||||
|
metadata: {
|
||||||
|
labels: {
|
||||||
|
app: appName,
|
||||||
|
},
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
containers: [
|
||||||
|
// ModelServer
|
||||||
|
{
|
||||||
|
args: [
|
||||||
|
"/usr/bin/tensorflow_model_server",
|
||||||
|
"--port=9000",
|
||||||
|
"--model_name=" + params.modelName,
|
||||||
|
"--model_base_path=" + params.modelBasePath,
|
||||||
|
],
|
||||||
|
image: image,
|
||||||
|
imagePullPolicy: "IfNotPresent",
|
||||||
|
name: "model-server",
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
containerPort: 9000,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
resources: {
|
||||||
|
limits: {
|
||||||
|
cpu: "4",
|
||||||
|
memory: "4Gi",
|
||||||
|
},
|
||||||
|
requests: {
|
||||||
|
cpu: "1",
|
||||||
|
memory: "1Gi",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
// Http proxy
|
||||||
|
{
|
||||||
|
name: "http-proxy",
|
||||||
|
image: httpProxyImage,
|
||||||
|
imagePullPolicy: "Always",
|
||||||
|
command: [
|
||||||
|
"python",
|
||||||
|
"/usr/src/app/server.py",
|
||||||
|
"--port=8000",
|
||||||
|
"--rpc_port=9000",
|
||||||
|
"--rpc_timeout=10.0",
|
||||||
|
"--log_request=true",
|
||||||
|
],
|
||||||
|
env: [],
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
containerPort: 8000,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
resources: {
|
||||||
|
requests: {
|
||||||
|
memory: "1Gi",
|
||||||
|
cpu: "1",
|
||||||
|
},
|
||||||
|
limits: {
|
||||||
|
memory: "4Gi",
|
||||||
|
cpu: "4",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
securityContext: {
|
||||||
|
runAsUser: 1000,
|
||||||
|
fsGroup: 1000,
|
||||||
|
},
|
||||||
|
volumeMounts: [
|
||||||
|
{
|
||||||
|
name: "request-logs",
|
||||||
|
mountPath: "/tmp/logs",
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
// TODO(lunkai): use admission controller to inject.
|
||||||
|
// Logging container.
|
||||||
|
{
|
||||||
|
name: "logging",
|
||||||
|
image: loggingImage,
|
||||||
|
imagePullPolicy: "Always",
|
||||||
|
env: [
|
||||||
|
{ name: "GOOGLE_APPLICATION_CREDENTIALS", value: "/secret/gcp-credentials/key.json" },
|
||||||
|
],
|
||||||
|
resources: {
|
||||||
|
requests: {
|
||||||
|
memory: "250Mi",
|
||||||
|
cpu: "0.25",
|
||||||
|
},
|
||||||
|
limits: {
|
||||||
|
memory: "500Mi",
|
||||||
|
cpu: "0.5",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
volumeMounts: [
|
||||||
|
{
|
||||||
|
name: "request-logs",
|
||||||
|
mountPath: "/tmp/logs",
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
mountPath: "/secret/gcp-credentials",
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "fluentd-config-volume",
|
||||||
|
mountPath: "/fluentd/etc/custom",
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
],
|
||||||
|
volumes: [
|
||||||
|
{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
secret: {
|
||||||
|
secretName: gcpSecretName,
|
||||||
|
},
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "request-logs",
|
||||||
|
emptyDir: {},
|
||||||
|
},
|
||||||
|
{
|
||||||
|
configMap: {
|
||||||
|
name: "fluentd-config",
|
||||||
|
},
|
||||||
|
name: "fluentd-config-volume",
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
};
|
||||||
|
|
||||||
|
k.core.v1.list.new([
|
||||||
|
service,
|
||||||
|
deployment,
|
||||||
|
configMap,
|
||||||
|
])
|
||||||
|
|
@ -0,0 +1,112 @@
|
||||||
|
local tfservingService = import "kubeflow/tf-serving/tf-serving-service-template.libsonnet";
|
||||||
|
local tfserving = import "kubeflow/tf-serving/tf-serving-template.libsonnet";
|
||||||
|
|
||||||
|
local params = {
|
||||||
|
name: "m",
|
||||||
|
serviceType: "ClusterIP",
|
||||||
|
modelName: "mnist",
|
||||||
|
trafficRule: "v1:100",
|
||||||
|
injectIstio: false,
|
||||||
|
};
|
||||||
|
|
||||||
|
local istioParams = params {
|
||||||
|
injectIstio: true,
|
||||||
|
};
|
||||||
|
|
||||||
|
local env = {
|
||||||
|
namespace: "kubeflow",
|
||||||
|
};
|
||||||
|
|
||||||
|
local deploymentParam = {
|
||||||
|
name: "m",
|
||||||
|
modelName: "mnist",
|
||||||
|
versionName: "v1",
|
||||||
|
modelBasePath: "gs://abc",
|
||||||
|
numGpus: 0,
|
||||||
|
defaultCpuImage: "gcr.io/abc",
|
||||||
|
defaultGpuImage: "gcr.io/abc",
|
||||||
|
injectIstio: false,
|
||||||
|
enablePrometheus: true,
|
||||||
|
};
|
||||||
|
|
||||||
|
local gpuParam1 = {
|
||||||
|
name: "m",
|
||||||
|
modelName: "mnist",
|
||||||
|
versionName: "v1",
|
||||||
|
modelBasePath: "gs://abc",
|
||||||
|
numGpus: 1,
|
||||||
|
defaultCpuImage: "gcr.io/abc",
|
||||||
|
defaultGpuImage: "gcr.io/abc",
|
||||||
|
injectIstio: false,
|
||||||
|
enablePrometheus: true,
|
||||||
|
};
|
||||||
|
|
||||||
|
local gpuParamString0 = {
|
||||||
|
name: "m",
|
||||||
|
modelName: "mnist",
|
||||||
|
versionName: "v1",
|
||||||
|
modelBasePath: "gs://abc",
|
||||||
|
numGpus: "0",
|
||||||
|
defaultCpuImage: "gcr.io/abc",
|
||||||
|
defaultGpuImage: "gcr.io/abc",
|
||||||
|
injectIstio: false,
|
||||||
|
enablePrometheus: true,
|
||||||
|
};
|
||||||
|
|
||||||
|
local gpuParamString1 = {
|
||||||
|
name: "m",
|
||||||
|
modelName: "mnist",
|
||||||
|
versionName: "v1",
|
||||||
|
modelBasePath: "gs://abc",
|
||||||
|
numGpus: "1",
|
||||||
|
defaultCpuImage: "gcr.io/abc",
|
||||||
|
defaultGpuImage: "gcr.io/abc",
|
||||||
|
injectIstio: false,
|
||||||
|
enablePrometheus: true,
|
||||||
|
};
|
||||||
|
|
||||||
|
local serviceInstance = tfservingService.new(env, params);
|
||||||
|
local istioServiceInstance = tfservingService.new(env, istioParams);
|
||||||
|
|
||||||
|
local deploymentInstance = tfserving.new(env, deploymentParam);
|
||||||
|
|
||||||
|
local gpuInstance = tfserving.new(env, gpuParam1);
|
||||||
|
local gpuString0Instance = tfserving.new(env, gpuParamString0);
|
||||||
|
local gpuString1Instance = tfserving.new(env, gpuParamString1);
|
||||||
|
|
||||||
|
// This one should only have tfService
|
||||||
|
std.assertEqual(
|
||||||
|
std.length(serviceInstance.all.items),
|
||||||
|
1,
|
||||||
|
) &&
|
||||||
|
|
||||||
|
// This one should have tfService, virtualService, and DestinationRule
|
||||||
|
std.assertEqual(
|
||||||
|
std.length(istioServiceInstance.all.items),
|
||||||
|
3
|
||||||
|
) &&
|
||||||
|
|
||||||
|
std.startsWith(
|
||||||
|
deploymentInstance.tfDeployment.spec.template.spec.containers[0].args[4],
|
||||||
|
"--monitoring_config_file"
|
||||||
|
) &&
|
||||||
|
|
||||||
|
std.assertEqual(
|
||||||
|
deploymentInstance.tfDeployment.spec.template.spec.containers[0].resources.limits,
|
||||||
|
{ cpu: "4", memory: "4Gi" }
|
||||||
|
) &&
|
||||||
|
|
||||||
|
std.assertEqual(
|
||||||
|
gpuInstance.tfDeployment.spec.template.spec.containers[0].resources.limits,
|
||||||
|
{ cpu: "4", memory: "4Gi", "nvidia.com/gpu": 1 }
|
||||||
|
) &&
|
||||||
|
|
||||||
|
std.assertEqual(
|
||||||
|
gpuString0Instance.tfDeployment.spec.template.spec.containers[0].resources.limits,
|
||||||
|
{ cpu: "4", memory: "4Gi" }
|
||||||
|
) &&
|
||||||
|
|
||||||
|
std.assertEqual(
|
||||||
|
gpuString1Instance.tfDeployment.spec.template.spec.containers[0].resources.limits,
|
||||||
|
{ cpu: "4", memory: "4Gi", "nvidia.com/gpu": 1 }
|
||||||
|
)
|
||||||
|
|
@ -0,0 +1,147 @@
|
||||||
|
{
|
||||||
|
local k = import "k.libsonnet",
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet",
|
||||||
|
new(_env, _params):: {
|
||||||
|
local params = _params + _env,
|
||||||
|
local namespace = params.namespace,
|
||||||
|
local name = params.name,
|
||||||
|
local modelName =
|
||||||
|
if params.modelName == "null" then
|
||||||
|
params.name
|
||||||
|
else
|
||||||
|
params.modelName,
|
||||||
|
|
||||||
|
local tfService = {
|
||||||
|
apiVersion: "v1",
|
||||||
|
kind: "Service",
|
||||||
|
metadata: {
|
||||||
|
labels: {
|
||||||
|
app: modelName,
|
||||||
|
},
|
||||||
|
name: name,
|
||||||
|
namespace: namespace,
|
||||||
|
annotations: {
|
||||||
|
"getambassador.io/config":
|
||||||
|
std.join("\n", [
|
||||||
|
"---",
|
||||||
|
"apiVersion: ambassador/v0",
|
||||||
|
"kind: Mapping",
|
||||||
|
"name: tfserving-predict-mapping-" + modelName,
|
||||||
|
"prefix: /tfserving/models/" + modelName,
|
||||||
|
"rewrite: /v1/models/" + modelName + ":predict",
|
||||||
|
"method: POST",
|
||||||
|
"service: " + name + "." + namespace + ":8500",
|
||||||
|
"---",
|
||||||
|
"apiVersion: ambassador/v0",
|
||||||
|
"kind: Mapping",
|
||||||
|
"name: tfserving-predict-mapping-" + modelName + "-get",
|
||||||
|
"prefix: /tfserving/models/" + modelName,
|
||||||
|
"rewrite: /v1/models/" + modelName,
|
||||||
|
"method: GET",
|
||||||
|
"service: " + name + "." + namespace + ":8500",
|
||||||
|
]),
|
||||||
|
} + if util.toBool(params.enablePrometheus) then {
|
||||||
|
"prometheus.io/scrape": "true",
|
||||||
|
"prometheus.io/path": "/monitoring/prometheus/metrics",
|
||||||
|
"prometheus.io/port": "8500",
|
||||||
|
} else {}, //annotations
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
name: "grpc-tf-serving",
|
||||||
|
port: 9000,
|
||||||
|
targetPort: 9000,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "http-tf-serving",
|
||||||
|
port: 8500,
|
||||||
|
targetPort: 8500,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
selector: {
|
||||||
|
app: modelName,
|
||||||
|
},
|
||||||
|
type: params.serviceType,
|
||||||
|
},
|
||||||
|
}, // tfService
|
||||||
|
tfService:: tfService,
|
||||||
|
|
||||||
|
local versionWeights = std.split(params.trafficRule, ","),
|
||||||
|
local virtualService = {
|
||||||
|
apiVersion: "networking.istio.io/v1alpha3",
|
||||||
|
kind: "VirtualService",
|
||||||
|
metadata: {
|
||||||
|
name: name,
|
||||||
|
namespace: namespace,
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
hosts: [
|
||||||
|
"*",
|
||||||
|
],
|
||||||
|
gateways: [
|
||||||
|
"kubeflow-gateway",
|
||||||
|
],
|
||||||
|
http: [
|
||||||
|
{
|
||||||
|
match: [
|
||||||
|
{
|
||||||
|
uri: {
|
||||||
|
prefix: "/istio/tfserving/models/" + modelName,
|
||||||
|
},
|
||||||
|
method: {
|
||||||
|
exact: "POST",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
],
|
||||||
|
rewrite: {
|
||||||
|
uri: "/v1/models/" + modelName + ":predict",
|
||||||
|
},
|
||||||
|
route: [
|
||||||
|
{
|
||||||
|
destination: {
|
||||||
|
host: name,
|
||||||
|
port: {
|
||||||
|
number: 8500,
|
||||||
|
},
|
||||||
|
subset: std.split(versionWeight, ":")[0],
|
||||||
|
},
|
||||||
|
weight: std.parseInt(std.split(versionWeight, ":")[1]),
|
||||||
|
}
|
||||||
|
for versionWeight in versionWeights
|
||||||
|
],
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
virtualService:: virtualService,
|
||||||
|
|
||||||
|
local destinationRule = {
|
||||||
|
apiVersion: "networking.istio.io/v1alpha3",
|
||||||
|
kind: "DestinationRule",
|
||||||
|
metadata: {
|
||||||
|
name: name,
|
||||||
|
namespace: namespace,
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
host: name,
|
||||||
|
subsets: [
|
||||||
|
{
|
||||||
|
name: std.split(versionWeight, ":")[0],
|
||||||
|
labels: {
|
||||||
|
version: std.split(versionWeight, ":")[0],
|
||||||
|
},
|
||||||
|
}
|
||||||
|
for versionWeight in versionWeights
|
||||||
|
],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
destinationRule:: destinationRule,
|
||||||
|
all:: util.list([
|
||||||
|
tfService,
|
||||||
|
] + if util.toBool(params.injectIstio) then [
|
||||||
|
virtualService,
|
||||||
|
destinationRule,
|
||||||
|
] else []),
|
||||||
|
}, // new
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,137 @@
|
||||||
|
{
|
||||||
|
local k = import "k.libsonnet",
|
||||||
|
local util = import "kubeflow/tf-serving/util.libsonnet",
|
||||||
|
new(_env, _params):: {
|
||||||
|
local params = _params + _env,
|
||||||
|
local namespace = params.namespace,
|
||||||
|
local name = params.name,
|
||||||
|
local modelName =
|
||||||
|
if params.modelName == "null" then
|
||||||
|
params.name
|
||||||
|
else
|
||||||
|
params.modelName,
|
||||||
|
local versionName = params.versionName,
|
||||||
|
local numGpus =
|
||||||
|
if std.type(params.numGpus) == "string" then
|
||||||
|
std.parseInt(params.numGpus)
|
||||||
|
else
|
||||||
|
params.numGpus,
|
||||||
|
local modelServerImage =
|
||||||
|
if numGpus == 0 then
|
||||||
|
params.defaultCpuImage
|
||||||
|
else
|
||||||
|
params.defaultGpuImage,
|
||||||
|
|
||||||
|
// Optional features.
|
||||||
|
// TODO(lunkai): Add request logging
|
||||||
|
|
||||||
|
local modelServerContainer = {
|
||||||
|
command: [
|
||||||
|
"/usr/bin/tensorflow_model_server",
|
||||||
|
],
|
||||||
|
args: [
|
||||||
|
"--port=9000",
|
||||||
|
"--rest_api_port=8500",
|
||||||
|
"--model_name=" + modelName,
|
||||||
|
"--model_base_path=" + params.modelBasePath,
|
||||||
|
] + if util.toBool(params.enablePrometheus) then [
|
||||||
|
"--monitoring_config_file=/var/config/monitoring_config.txt",
|
||||||
|
] else [],
|
||||||
|
image: modelServerImage,
|
||||||
|
imagePullPolicy: "IfNotPresent",
|
||||||
|
name: modelName,
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
containerPort: 9000,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
containerPort: 8500,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
env: [],
|
||||||
|
resources: {
|
||||||
|
limits: {
|
||||||
|
cpu: "4",
|
||||||
|
memory: "4Gi",
|
||||||
|
} + if numGpus != 0 then {
|
||||||
|
"nvidia.com/gpu": numGpus,
|
||||||
|
} else {},
|
||||||
|
requests: {
|
||||||
|
cpu: "1",
|
||||||
|
memory: "1Gi",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
volumeMounts: [
|
||||||
|
{
|
||||||
|
mountPath: "/var/config/",
|
||||||
|
name: "config-volume",
|
||||||
|
},
|
||||||
|
],
|
||||||
|
// TCP liveness probe on gRPC port
|
||||||
|
livenessProbe: {
|
||||||
|
tcpSocket: {
|
||||||
|
port: 9000,
|
||||||
|
},
|
||||||
|
initialDelaySeconds: 30,
|
||||||
|
periodSeconds: 30,
|
||||||
|
},
|
||||||
|
}, // modelServerContainer
|
||||||
|
|
||||||
|
local tfDeployment = {
|
||||||
|
apiVersion: "extensions/v1beta1",
|
||||||
|
kind: "Deployment",
|
||||||
|
metadata: {
|
||||||
|
labels: {
|
||||||
|
app: modelName,
|
||||||
|
},
|
||||||
|
name: name,
|
||||||
|
namespace: namespace,
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
template: {
|
||||||
|
metadata: {
|
||||||
|
labels: {
|
||||||
|
app: modelName,
|
||||||
|
version: versionName,
|
||||||
|
},
|
||||||
|
annotations: {
|
||||||
|
"sidecar.istio.io/inject": if util.toBool(params.injectIstio) then "true",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
containers: [
|
||||||
|
modelServerContainer,
|
||||||
|
],
|
||||||
|
volumes: [
|
||||||
|
{
|
||||||
|
configMap: {
|
||||||
|
name: name + "-config",
|
||||||
|
},
|
||||||
|
name: "config-volume",
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
}, // tfDeployment
|
||||||
|
tfDeployment:: tfDeployment,
|
||||||
|
|
||||||
|
local tfservingConfig = {
|
||||||
|
apiVersion: "v1",
|
||||||
|
kind: "ConfigMap",
|
||||||
|
metadata: {
|
||||||
|
name: name + "-config",
|
||||||
|
namespace: namespace,
|
||||||
|
},
|
||||||
|
data: {
|
||||||
|
"monitoring_config.txt": std.join("\n", [
|
||||||
|
"prometheus_config: {",
|
||||||
|
" enable: true,",
|
||||||
|
' path: "/monitoring/prometheus/metrics"',
|
||||||
|
"}",
|
||||||
|
]),
|
||||||
|
},
|
||||||
|
}, // tfservingConfig
|
||||||
|
tfservingConfig:: tfservingConfig,
|
||||||
|
}, // new
|
||||||
|
}
|
||||||
|
|
@ -0,0 +1,380 @@
|
||||||
|
{
|
||||||
|
util:: import "kubeflow/tf-serving/util.libsonnet",
|
||||||
|
|
||||||
|
// Parameters are intended to be late bound.
|
||||||
|
params:: {
|
||||||
|
name: null,
|
||||||
|
numGpus: 0,
|
||||||
|
labels: {
|
||||||
|
app: $.params.name,
|
||||||
|
},
|
||||||
|
modelName: $.params.name,
|
||||||
|
modelPath: null,
|
||||||
|
modelStorageType: "storageType",
|
||||||
|
|
||||||
|
version: "v1",
|
||||||
|
firstVersion: true,
|
||||||
|
|
||||||
|
deployIstio: false,
|
||||||
|
|
||||||
|
deployHttpProxy: false,
|
||||||
|
httpProxyImage: "gcr.io/kubeflow-images-public/tf-model-server-http-proxy:v20180606-9dfda4f2",
|
||||||
|
|
||||||
|
serviceType: "ClusterIP",
|
||||||
|
|
||||||
|
// If users want to override the image then can override defaultCpuImage and/or defaultGpuImage
|
||||||
|
// in which case the image used will still depend on whether GPUs are used or not.
|
||||||
|
// Users can also override modelServerImage in which case the user supplied value will always be used
|
||||||
|
// regardless of numGpus.
|
||||||
|
defaultCpuImage: "tensorflow/serving:1.11.1",
|
||||||
|
defaultGpuImage: "tensorflow/serving:1.11.1-gpu",
|
||||||
|
modelServerImage: if $.params.numGpus == 0 then
|
||||||
|
$.params.defaultCpuImage
|
||||||
|
else
|
||||||
|
$.params.defaultGpuImage,
|
||||||
|
|
||||||
|
|
||||||
|
// Whether or not to enable s3 parameters
|
||||||
|
s3Enable:: false,
|
||||||
|
|
||||||
|
// Which storageType to use
|
||||||
|
storageType:: null,
|
||||||
|
},
|
||||||
|
|
||||||
|
// Parametes specific to GCP.
|
||||||
|
gcpParams:: {
|
||||||
|
gcpCredentialSecretName: "",
|
||||||
|
} + $.params,
|
||||||
|
|
||||||
|
// Parameters that control S3 access
|
||||||
|
// params overrides s3params because params can be overwritten by the user to override the defaults.
|
||||||
|
s3params:: {
|
||||||
|
// Name of the k8s secrets containing S3 credentials
|
||||||
|
s3SecretName: "",
|
||||||
|
// Name of the key in the k8s secret containing AWS_ACCESS_KEY_ID.
|
||||||
|
s3SecretAccesskeyidKeyName: "AWS_ACCESS_KEY_ID",
|
||||||
|
|
||||||
|
// Name of the key in the k8s secret containing AWS_SECRET_ACCESS_KEY.
|
||||||
|
s3SecretSecretaccesskeyKeyName: "AWS_SECRET_ACCESS_KEY",
|
||||||
|
|
||||||
|
// S3 region
|
||||||
|
s3AwsRegion: "us-west-1",
|
||||||
|
|
||||||
|
// TODO(jlewi): We should use util.toBool to automatically conver to actual boolean values.
|
||||||
|
// The use of strings is left over from when they were prototype parameters which only supports string type.
|
||||||
|
|
||||||
|
// true Whether or not to use https for S3 connections
|
||||||
|
s3UseHttps: "true",
|
||||||
|
|
||||||
|
// Whether or not to verify https certificates for S3 connections
|
||||||
|
s3VerifySsl: "true",
|
||||||
|
|
||||||
|
// URL for your s3-compatible endpoint.
|
||||||
|
s3Endpoint: "http://s3.us-west-1.amazonaws.com,",
|
||||||
|
} + $.params,
|
||||||
|
|
||||||
|
|
||||||
|
components:: {
|
||||||
|
|
||||||
|
all:: [
|
||||||
|
// Default routing rule for the first version of model.
|
||||||
|
if $.util.toBool($.params.deployIstio) && $.util.toBool($.params.firstVersion) then
|
||||||
|
$.parts.defaultRouteRule,
|
||||||
|
] +
|
||||||
|
// TODO(jlewi): It would be better to structure s3 as a mixin.
|
||||||
|
// As an example it would be great to allow S3 and GCS parameters
|
||||||
|
// to be enabled simultaneously. This should be doable because
|
||||||
|
// each entails adding a set of environment variables and volumes
|
||||||
|
// to the containers. These volumes/environment variables shouldn't
|
||||||
|
// overlap so there's no reason we shouldn't be able to just add
|
||||||
|
// both modifications to the base container.
|
||||||
|
// I think we want to restructure things as mixins so they can just
|
||||||
|
// be added.
|
||||||
|
if $.params.s3Enable then
|
||||||
|
[
|
||||||
|
$.s3parts.tfService,
|
||||||
|
$.s3parts.tfDeployment,
|
||||||
|
]
|
||||||
|
else if $.params.storageType == "gcp" then
|
||||||
|
[
|
||||||
|
$.gcpParts.tfService,
|
||||||
|
$.gcpParts.tfDeployment,
|
||||||
|
]
|
||||||
|
else
|
||||||
|
[
|
||||||
|
$.parts.tfService,
|
||||||
|
$.parts.tfDeployment,
|
||||||
|
],
|
||||||
|
}.all,
|
||||||
|
|
||||||
|
parts:: {
|
||||||
|
// We define the containers one level beneath parts because combined with jsonnet late binding
|
||||||
|
// this makes it easy for users to override specific bits of the container.
|
||||||
|
tfServingContainerBase:: {
|
||||||
|
name: $.params.name,
|
||||||
|
image: $.params.modelServerImage,
|
||||||
|
imagePullPolicy: "IfNotPresent",
|
||||||
|
command: [
|
||||||
|
"/usr/bin/tensorflow_model_server",
|
||||||
|
],
|
||||||
|
args: [
|
||||||
|
"--port=9000",
|
||||||
|
"--model_name=" + $.params.modelName,
|
||||||
|
"--model_base_path=" + $.params.modelPath,
|
||||||
|
],
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
containerPort: 9000,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
// TODO(jlewi): We should add readiness and liveness probes. I think the blocker is that
|
||||||
|
// model-server doesn't have something we can use out of the box.
|
||||||
|
resources: {
|
||||||
|
requests: {
|
||||||
|
memory: "1Gi",
|
||||||
|
cpu: "1",
|
||||||
|
},
|
||||||
|
limits: {
|
||||||
|
memory: "4Gi",
|
||||||
|
cpu: "4",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
// The is user and group should be defined in the Docker image.
|
||||||
|
// Per best practices we don't run as the root user.
|
||||||
|
securityContext: {
|
||||||
|
runAsUser: 1000,
|
||||||
|
fsGroup: 1000,
|
||||||
|
},
|
||||||
|
volumeMounts+: if $.params.modelStorageType == "nfs" then [{
|
||||||
|
name: "nfs",
|
||||||
|
mountPath: "/mnt",
|
||||||
|
}]
|
||||||
|
else [],
|
||||||
|
}, // tfServingContainer
|
||||||
|
|
||||||
|
tfServingContainer+: $.parts.tfServingContainerBase +
|
||||||
|
if $.params.numGpus > 0 then
|
||||||
|
{
|
||||||
|
resources+: {
|
||||||
|
limits+: {
|
||||||
|
"nvidia.com/gpu": $.params.numGpus,
|
||||||
|
},
|
||||||
|
},
|
||||||
|
}
|
||||||
|
else {},
|
||||||
|
|
||||||
|
tfServingMetadata+: {
|
||||||
|
labels: $.params.labels { version: $.params.version },
|
||||||
|
annotations: {
|
||||||
|
"sidecar.istio.io/inject": if $.util.toBool($.params.deployIstio) then "true",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
|
||||||
|
httpProxyContainer:: {
|
||||||
|
name: $.params.name + "-http-proxy",
|
||||||
|
image: $.params.httpProxyImage,
|
||||||
|
imagePullPolicy: "IfNotPresent",
|
||||||
|
command: [
|
||||||
|
"python",
|
||||||
|
"/usr/src/app/server.py",
|
||||||
|
"--port=8000",
|
||||||
|
"--rpc_port=9000",
|
||||||
|
"--rpc_timeout=10.0",
|
||||||
|
],
|
||||||
|
env: [],
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
containerPort: 8000,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
resources: {
|
||||||
|
requests: {
|
||||||
|
memory: "500Mi",
|
||||||
|
cpu: "0.5",
|
||||||
|
},
|
||||||
|
limits: {
|
||||||
|
memory: "1Gi",
|
||||||
|
cpu: "1",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
securityContext: {
|
||||||
|
runAsUser: 1000,
|
||||||
|
fsGroup: 1000,
|
||||||
|
},
|
||||||
|
}, // httpProxyContainer
|
||||||
|
|
||||||
|
|
||||||
|
tfDeployment: {
|
||||||
|
apiVersion: "extensions/v1beta1",
|
||||||
|
kind: "Deployment",
|
||||||
|
metadata: {
|
||||||
|
name: $.params.name + "-" + $.params.version,
|
||||||
|
namespace: $.params.namespace,
|
||||||
|
labels: $.params.labels,
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
template: {
|
||||||
|
metadata: $.parts.tfServingMetadata,
|
||||||
|
spec: {
|
||||||
|
containers: [
|
||||||
|
$.parts.tfServingContainer,
|
||||||
|
if $.util.toBool($.params.deployHttpProxy) then
|
||||||
|
$.parts.httpProxyContainer,
|
||||||
|
],
|
||||||
|
volumes+: if $.params.modelStorageType == "nfs" then
|
||||||
|
[{
|
||||||
|
name: "nfs",
|
||||||
|
persistentVolumeClaim: {
|
||||||
|
claimName: $.params.nfsPVC,
|
||||||
|
},
|
||||||
|
}]
|
||||||
|
else [],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
}, // tfDeployment
|
||||||
|
|
||||||
|
tfService: {
|
||||||
|
apiVersion: "v1",
|
||||||
|
kind: "Service",
|
||||||
|
metadata: {
|
||||||
|
labels: $.params.labels,
|
||||||
|
name: $.params.name,
|
||||||
|
namespace: $.params.namespace,
|
||||||
|
annotations: {
|
||||||
|
"getambassador.io/config":
|
||||||
|
std.join("\n", [
|
||||||
|
"---",
|
||||||
|
"apiVersion: ambassador/v0",
|
||||||
|
"kind: Mapping",
|
||||||
|
"name: tfserving-mapping-" + $.params.name + "-get",
|
||||||
|
"prefix: /models/" + $.params.name + "/",
|
||||||
|
"rewrite: /",
|
||||||
|
"method: GET",
|
||||||
|
"service: " + $.params.name + "." + $.params.namespace + ":8000",
|
||||||
|
"---",
|
||||||
|
"apiVersion: ambassador/v0",
|
||||||
|
"kind: Mapping",
|
||||||
|
"name: tfserving-mapping-" + $.params.name + "-post",
|
||||||
|
"prefix: /models/" + $.params.name + "/",
|
||||||
|
"rewrite: /model/" + $.params.name + ":predict",
|
||||||
|
"method: POST",
|
||||||
|
"service: " + $.params.name + "." + $.params.namespace + ":8000",
|
||||||
|
]),
|
||||||
|
}, //annotations
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
ports: [
|
||||||
|
{
|
||||||
|
name: "grpc-tf-serving",
|
||||||
|
port: 9000,
|
||||||
|
targetPort: 9000,
|
||||||
|
},
|
||||||
|
{
|
||||||
|
name: "http-tf-serving-proxy",
|
||||||
|
port: 8000,
|
||||||
|
targetPort: 8000,
|
||||||
|
},
|
||||||
|
],
|
||||||
|
selector: $.params.labels,
|
||||||
|
type: $.params.serviceType,
|
||||||
|
},
|
||||||
|
}, // tfService
|
||||||
|
|
||||||
|
defaultRouteRule: {
|
||||||
|
apiVersion: "config.istio.io/v1alpha2",
|
||||||
|
kind: "RouteRule",
|
||||||
|
metadata: {
|
||||||
|
name: $.params.name + "-default",
|
||||||
|
namespace: $.params.namespace,
|
||||||
|
},
|
||||||
|
spec: {
|
||||||
|
destination: {
|
||||||
|
name: $.params.name,
|
||||||
|
},
|
||||||
|
precedence: 0,
|
||||||
|
route: [
|
||||||
|
{
|
||||||
|
labels: { version: $.params.version },
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
|
||||||
|
}, // parts
|
||||||
|
|
||||||
|
// Parts specific to S3
|
||||||
|
s3parts:: $.parts {
|
||||||
|
s3Env:: [
|
||||||
|
{ name: "AWS_ACCESS_KEY_ID", valueFrom: { secretKeyRef: { name: $.s3params.s3SecretName, key: $.s3params.s3SecretAccesskeyidKeyName } } },
|
||||||
|
{ name: "AWS_SECRET_ACCESS_KEY", valueFrom: { secretKeyRef: { name: $.s3params.s3SecretName, key: $.s3params.s3SecretSecretaccesskeyKeyName } } },
|
||||||
|
{ name: "AWS_REGION", value: $.s3params.s3AwsRegion },
|
||||||
|
{ name: "S3_REGION", value: $.s3params.s3AwsRegion },
|
||||||
|
{ name: "S3_USE_HTTPS", value: $.s3params.s3UseHttps },
|
||||||
|
{ name: "S3_VERIFY_SSL", value: $.s3params.s3VerifySsl },
|
||||||
|
{ name: "S3_ENDPOINT", value: $.s3params.s3Endpoint },
|
||||||
|
],
|
||||||
|
|
||||||
|
tfServingContainer: $.parts.tfServingContainer {
|
||||||
|
env+: $.s3parts.s3Env,
|
||||||
|
},
|
||||||
|
|
||||||
|
tfDeployment: $.parts.tfDeployment {
|
||||||
|
spec: +{
|
||||||
|
template: +{
|
||||||
|
metadata: $.parts.tfServingMetadata,
|
||||||
|
spec: +{
|
||||||
|
containers: [
|
||||||
|
$.s3parts.tfServingContainer,
|
||||||
|
if $.util.toBool($.params.deployHttpProxy) then
|
||||||
|
$.parts.httpProxyContainer,
|
||||||
|
],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
}, // tfDeployment
|
||||||
|
}, // s3parts
|
||||||
|
|
||||||
|
// Parts specific to GCP
|
||||||
|
gcpParts:: $.parts {
|
||||||
|
gcpEnv:: [
|
||||||
|
if $.gcpParams.gcpCredentialSecretName != "" then
|
||||||
|
{ name: "GOOGLE_APPLICATION_CREDENTIALS", value: "/secret/gcp-credentials/user-gcp-sa.json" },
|
||||||
|
],
|
||||||
|
|
||||||
|
tfServingContainer: $.parts.tfServingContainer {
|
||||||
|
env+: $.gcpParts.gcpEnv,
|
||||||
|
volumeMounts+: [
|
||||||
|
if $.gcpParams.gcpCredentialSecretName != "" then
|
||||||
|
{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
mountPath: "/secret/gcp-credentials",
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
|
||||||
|
tfDeployment: $.parts.tfDeployment {
|
||||||
|
spec+: {
|
||||||
|
template+: {
|
||||||
|
metadata: $.parts.tfServingMetadata,
|
||||||
|
spec+: {
|
||||||
|
containers: [
|
||||||
|
$.gcpParts.tfServingContainer,
|
||||||
|
if $.util.toBool($.params.deployHttpProxy) then
|
||||||
|
$.parts.httpProxyContainer,
|
||||||
|
],
|
||||||
|
volumes: [
|
||||||
|
if $.gcpParams.gcpCredentialSecretName != "" then
|
||||||
|
{
|
||||||
|
name: "gcp-credentials",
|
||||||
|
secret: {
|
||||||
|
secretName: $.gcpParams.gcpCredentialSecretName,
|
||||||
|
},
|
||||||
|
},
|
||||||
|
],
|
||||||
|
},
|
||||||
|
},
|
||||||
|
},
|
||||||
|
}, // tfDeployment
|
||||||
|
}, // gcpParts
|
||||||
|
}
|
||||||
21
mnist/ks_app/vendor/kubeflow/tf-serving@fed535eaa276220e4edf59530c0629f4375a40a9/util.libsonnet
vendored
Normal file
21
mnist/ks_app/vendor/kubeflow/tf-serving@fed535eaa276220e4edf59530c0629f4375a40a9/util.libsonnet
vendored
Normal file
|
|
@ -0,0 +1,21 @@
|
||||||
|
// Some useful routines.
|
||||||
|
{
|
||||||
|
local k = import "k.libsonnet",
|
||||||
|
|
||||||
|
// Convert non-boolean types like string,number to a boolean.
|
||||||
|
// This is primarily intended for dealing with parameters that should be booleans.
|
||||||
|
toBool:: function(x) {
|
||||||
|
result::
|
||||||
|
if std.type(x) == "boolean" then
|
||||||
|
x
|
||||||
|
else if std.type(x) == "string" then
|
||||||
|
std.asciiUpper(x) == "TRUE"
|
||||||
|
else if std.type(x) == "number" then
|
||||||
|
x != 0
|
||||||
|
else
|
||||||
|
false,
|
||||||
|
}.result,
|
||||||
|
|
||||||
|
// Produce a list of manifests. obj must be an array
|
||||||
|
list(obj):: k.core.v1.list.new(obj,),
|
||||||
|
}
|
||||||
|
|
@ -21,6 +21,7 @@ from __future__ import absolute_import
|
||||||
from __future__ import division
|
from __future__ import division
|
||||||
from __future__ import print_function
|
from __future__ import print_function
|
||||||
|
|
||||||
|
import json
|
||||||
import os
|
import os
|
||||||
import sys
|
import sys
|
||||||
import numpy as np
|
import numpy as np
|
||||||
|
|
@ -126,6 +127,22 @@ def linear_serving_input_receiver_fn():
|
||||||
def main(_):
|
def main(_):
|
||||||
tf.logging.set_verbosity(tf.logging.INFO)
|
tf.logging.set_verbosity(tf.logging.INFO)
|
||||||
|
|
||||||
|
tf_config = os.environ.get('TF_CONFIG', '{}')
|
||||||
|
tf.logging.info("TF_CONFIG %s", tf_config)
|
||||||
|
tf_config_json = json.loads(tf_config)
|
||||||
|
cluster = tf_config_json.get('cluster')
|
||||||
|
job_name = tf_config_json.get('task', {}).get('type')
|
||||||
|
task_index = tf_config_json.get('task', {}).get('index')
|
||||||
|
tf.logging.info("cluster=%s job_name=%s task_index=%s", cluster, job_name,
|
||||||
|
task_index)
|
||||||
|
|
||||||
|
is_chief = False
|
||||||
|
if not job_name or job_name.lower() in ["chief", "master"]:
|
||||||
|
is_chief = True
|
||||||
|
tf.logging.info("Will export model")
|
||||||
|
else:
|
||||||
|
tf.logging.info("Will not export model")
|
||||||
|
|
||||||
# Download and load MNIST dataset.
|
# Download and load MNIST dataset.
|
||||||
mnist = tf.contrib.learn.datasets.DATASETS['mnist'](TF_DATA_DIR)
|
mnist = tf.contrib.learn.datasets.DATASETS['mnist'](TF_DATA_DIR)
|
||||||
train_input_fn = tf.estimator.inputs.numpy_input_fn(
|
train_input_fn = tf.estimator.inputs.numpy_input_fn(
|
||||||
|
|
@ -151,6 +168,8 @@ def main(_):
|
||||||
classifier = tf.estimator.LinearClassifier(
|
classifier = tf.estimator.LinearClassifier(
|
||||||
feature_columns=feature_columns, n_classes=N_DIGITS,
|
feature_columns=feature_columns, n_classes=N_DIGITS,
|
||||||
model_dir=TF_MODEL_DIR, config=training_config)
|
model_dir=TF_MODEL_DIR, config=training_config)
|
||||||
|
# TODO(jlewi): Should it be linear_serving_input_receiver_fn here?
|
||||||
|
serving_fn = cnn_serving_input_receiver_fn
|
||||||
export_final = tf.estimator.FinalExporter(
|
export_final = tf.estimator.FinalExporter(
|
||||||
TF_EXPORT_DIR, serving_input_receiver_fn=cnn_serving_input_receiver_fn)
|
TF_EXPORT_DIR, serving_input_receiver_fn=cnn_serving_input_receiver_fn)
|
||||||
|
|
||||||
|
|
@ -158,6 +177,7 @@ def main(_):
|
||||||
# Convolutional network
|
# Convolutional network
|
||||||
classifier = tf.estimator.Estimator(
|
classifier = tf.estimator.Estimator(
|
||||||
model_fn=conv_model, model_dir=TF_MODEL_DIR, config=training_config)
|
model_fn=conv_model, model_dir=TF_MODEL_DIR, config=training_config)
|
||||||
|
serving_fn = cnn_serving_input_receiver_fn
|
||||||
export_final = tf.estimator.FinalExporter(
|
export_final = tf.estimator.FinalExporter(
|
||||||
TF_EXPORT_DIR, serving_input_receiver_fn=cnn_serving_input_receiver_fn)
|
TF_EXPORT_DIR, serving_input_receiver_fn=cnn_serving_input_receiver_fn)
|
||||||
else:
|
else:
|
||||||
|
|
@ -171,7 +191,14 @@ def main(_):
|
||||||
exporters=export_final,
|
exporters=export_final,
|
||||||
throttle_secs=1,
|
throttle_secs=1,
|
||||||
start_delay_secs=1)
|
start_delay_secs=1)
|
||||||
|
print("Train and evaluate")
|
||||||
tf.estimator.train_and_evaluate(classifier, train_spec, eval_spec)
|
tf.estimator.train_and_evaluate(classifier, train_spec, eval_spec)
|
||||||
|
print("Training done")
|
||||||
|
|
||||||
|
if is_chief:
|
||||||
|
print("Export saved model")
|
||||||
|
classifier.export_savedmodel(TF_EXPORT_DIR, serving_input_receiver_fn=serving_fn)
|
||||||
|
print("Done exporting the model")
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
tf.app.run()
|
tf.app.run()
|
||||||
|
|
|
||||||
|
|
@ -0,0 +1,76 @@
|
||||||
|
"""Test deploying the mnist model.
|
||||||
|
|
||||||
|
This file tests that we can deploy the model.
|
||||||
|
|
||||||
|
TODO(jlewi): Test that we can send predictions to the model.
|
||||||
|
|
||||||
|
It is an integration test as it depends on having access to
|
||||||
|
a Kubeflow deployment to deploy on. It also depends on having a model.
|
||||||
|
|
||||||
|
Python Path Requirements:
|
||||||
|
kubeflow/testing/py - https://github.com/kubeflow/testing/tree/master/py
|
||||||
|
* Provides utilities for testing
|
||||||
|
|
||||||
|
Manually running the test
|
||||||
|
1. Configure your KUBECONFIG file to point to the desired cluster
|
||||||
|
2. Set --params=name=${NAME},namespace=${NAMESPACE}
|
||||||
|
* name should be the name for your job
|
||||||
|
* namespace should be the namespace to use
|
||||||
|
3. Use the modelBasePath parameter to the model to test.
|
||||||
|
--params=...,modelBasePath=${MODEL_BASE_PATH}
|
||||||
|
|
||||||
|
"""
|
||||||
|
|
||||||
|
import logging
|
||||||
|
import os
|
||||||
|
|
||||||
|
from kubernetes import client as k8s_client
|
||||||
|
from py import test_runner
|
||||||
|
|
||||||
|
from kubeflow.testing import ks_util
|
||||||
|
from kubeflow.testing import test_util
|
||||||
|
from kubeflow.testing import util
|
||||||
|
|
||||||
|
class MnistDeployTest(test_util.TestCase):
|
||||||
|
def __init__(self, args):
|
||||||
|
namespace, name, env = test_runner.parse_runtime_params(args)
|
||||||
|
self.app_dir = args.app_dir
|
||||||
|
|
||||||
|
if not self.app_dir:
|
||||||
|
self.app_dir = os.path.join(os.path.dirname(__file__), "..",
|
||||||
|
"ks_app")
|
||||||
|
self.app_dir = os.path.abspath(self.app_dir)
|
||||||
|
logging.info("--app_dir not set defaulting to: %s", self.app_dir)
|
||||||
|
|
||||||
|
self.env = env
|
||||||
|
self.namespace = namespace
|
||||||
|
self.params = args.params
|
||||||
|
self.ks_cmd = ks_util.get_ksonnet_cmd(self.app_dir)
|
||||||
|
super(MnistDeployTest, self).__init__(class_name="MnistDeployTest",
|
||||||
|
name=name)
|
||||||
|
|
||||||
|
def test_serve(self):
|
||||||
|
# We repeat the test multiple times.
|
||||||
|
# This ensures that if we delete the job we can create a new job with the
|
||||||
|
# same name.
|
||||||
|
api_client = k8s_client.ApiClient()
|
||||||
|
|
||||||
|
# Apply the components
|
||||||
|
for component in ["mnist-deploy-gcp", "mnist-service"]:
|
||||||
|
# Setup the ksonnet app
|
||||||
|
ks_util.setup_ks_app(self.app_dir, self.env, self.namespace, component,
|
||||||
|
self.params)
|
||||||
|
|
||||||
|
util.run([self.ks_cmd, "apply", self.env, "-c", component],
|
||||||
|
cwd=self.app_dir)
|
||||||
|
|
||||||
|
logging.info("Created deployment %s in namespaces %s", self.name, self.namespace)
|
||||||
|
|
||||||
|
util.wait_for_deployment(api_client, self.namespace, self.name,
|
||||||
|
timeout_minutes=4)
|
||||||
|
|
||||||
|
# We don't delete the resources. We depend on the namespace being
|
||||||
|
# garbage collected.
|
||||||
|
|
||||||
|
if __name__ == "__main__":
|
||||||
|
test_runner.main(module=__name__)
|
||||||
|
|
@ -0,0 +1,33 @@
|
||||||
|
#!/bin/bash
|
||||||
|
#
|
||||||
|
# A simple script to copy a secret from 1 namespace to another
|
||||||
|
#
|
||||||
|
# Usage
|
||||||
|
# copy_secret <source namepspace> <dest namespace> <secret name>
|
||||||
|
set -e
|
||||||
|
SOURCE=$1
|
||||||
|
DEST=$2
|
||||||
|
NAME=$3
|
||||||
|
|
||||||
|
usage() {
|
||||||
|
echo copy_secret "<source namepspace> <dest namespace> <secret name>"
|
||||||
|
}
|
||||||
|
|
||||||
|
if [ -z ${SOURCE} ]; then
|
||||||
|
usage
|
||||||
|
exit -1
|
||||||
|
fi
|
||||||
|
|
||||||
|
if [ -z ${DEST} ]; then
|
||||||
|
usage
|
||||||
|
exit -1
|
||||||
|
fi
|
||||||
|
|
||||||
|
if [ -z ${NAME} ]; then
|
||||||
|
usage
|
||||||
|
exit -1
|
||||||
|
fi
|
||||||
|
|
||||||
|
echo getting secret
|
||||||
|
SECRET=$(kubectl -n ${SOURCE} get secrets user-gcp-sa -o jsonpath="{.data.${NAME}\.json}" | base64 -d)
|
||||||
|
kubectl create -n ${DEST} secret generic ${NAME} --from-literal="${NAME}.json=${SECRET}"
|
||||||
|
|
@ -25,6 +25,12 @@ local defaultParams = {
|
||||||
// The bucket where the model should be written
|
// The bucket where the model should be written
|
||||||
// This needs to be writable by the GCP service account in the Kubeflow cluster (not the test cluster)
|
// This needs to be writable by the GCP service account in the Kubeflow cluster (not the test cluster)
|
||||||
modelBucket: "kubeflow-ci_temp",
|
modelBucket: "kubeflow-ci_temp",
|
||||||
|
|
||||||
|
// Whether to delete the namespace at the end.
|
||||||
|
// Leaving the namespace around can be useful for debugging.
|
||||||
|
//
|
||||||
|
// TODO(jlewi): We should consider running a cronjob to GC so namespaces.
|
||||||
|
deleteNamespace: false,
|
||||||
};
|
};
|
||||||
|
|
||||||
local params = defaultParams + overrides;
|
local params = defaultParams + overrides;
|
||||||
|
|
@ -77,6 +83,9 @@ local modelDir = "gs://" + params.modelBucket + "/mnist/models/" + prowDict["BUI
|
||||||
// value of KUBECONFIG environment variable. This should be a full path.
|
// value of KUBECONFIG environment variable. This should be a full path.
|
||||||
local kubeConfig = testDir + "/.kube/kubeconfig";
|
local kubeConfig = testDir + "/.kube/kubeconfig";
|
||||||
|
|
||||||
|
// Namespace where tests should run
|
||||||
|
local testNamespace = "mnist-" + prowDict["BUILD_ID"];
|
||||||
|
|
||||||
// Build template is a template for constructing Argo step templates.
|
// Build template is a template for constructing Argo step templates.
|
||||||
//
|
//
|
||||||
// step_name: Name for the template
|
// step_name: Name for the template
|
||||||
|
|
@ -233,10 +242,48 @@ local dagTemplates = [
|
||||||
params.kfCluster,
|
params.kfCluster,
|
||||||
]]
|
]]
|
||||||
),
|
),
|
||||||
workingDir: srcDir + "/github_issue_summarization",
|
|
||||||
},
|
},
|
||||||
dependencies: ["checkout"],
|
dependencies: ["checkout"],
|
||||||
}, // get-kubeconfig
|
}, // get-kubeconfig
|
||||||
|
{
|
||||||
|
// Create the namespace
|
||||||
|
// TODO(jlewi): We should add some sort of retry.
|
||||||
|
template: buildTemplate {
|
||||||
|
name: "create-namespace",
|
||||||
|
command: util.buildCommand([
|
||||||
|
[
|
||||||
|
"echo",
|
||||||
|
"KUBECONFIG=",
|
||||||
|
"${KUBECONFIG}",
|
||||||
|
],
|
||||||
|
[
|
||||||
|
"gcloud",
|
||||||
|
"auth",
|
||||||
|
"activate-service-account",
|
||||||
|
"--key-file=${GOOGLE_APPLICATION_CREDENTIALS}",
|
||||||
|
],
|
||||||
|
[
|
||||||
|
"kubectl",
|
||||||
|
"config" ,
|
||||||
|
"current-context",
|
||||||
|
],
|
||||||
|
[
|
||||||
|
"kubectl",
|
||||||
|
"create",
|
||||||
|
"namespace",
|
||||||
|
testNamespace,
|
||||||
|
],
|
||||||
|
# Copy the GCP secret from the kubeflow namespace to the test namespace
|
||||||
|
[
|
||||||
|
srcDir + "/test/copy_secret.sh",
|
||||||
|
"kubeflow",
|
||||||
|
testNamespace,
|
||||||
|
"user-gcp-sa",
|
||||||
|
]]
|
||||||
|
),
|
||||||
|
},
|
||||||
|
dependencies: ["get-kubeconfig"],
|
||||||
|
}, // create-namespace
|
||||||
{
|
{
|
||||||
// Run the python test for TFJob
|
// Run the python test for TFJob
|
||||||
template: buildTemplate {
|
template: buildTemplate {
|
||||||
|
|
@ -247,7 +294,7 @@ local dagTemplates = [
|
||||||
"--artifacts_path=" + artifactsDir,
|
"--artifacts_path=" + artifactsDir,
|
||||||
"--params=" + std.join(",", [
|
"--params=" + std.join(",", [
|
||||||
"name=mnist-test-" + prowDict["BUILD_ID"],
|
"name=mnist-test-" + prowDict["BUILD_ID"],
|
||||||
"namespace=kubeflow",
|
"namespace=" + testNamespace,
|
||||||
"numTrainSteps=10",
|
"numTrainSteps=10",
|
||||||
"batchSize=10",
|
"batchSize=10",
|
||||||
"image=" + trainerImage,
|
"image=" + trainerImage,
|
||||||
|
|
@ -260,8 +307,25 @@ local dagTemplates = [
|
||||||
])],
|
])],
|
||||||
workingDir: srcDir + "/mnist/testing",
|
workingDir: srcDir + "/mnist/testing",
|
||||||
},
|
},
|
||||||
dependencies: ["build-images", "get-kubeconfig"],
|
dependencies: ["build-images", "create-namespace"],
|
||||||
}, // tfjob-test
|
}, // tfjob-test
|
||||||
|
{
|
||||||
|
// Run the python test for TFJob
|
||||||
|
template: buildTemplate {
|
||||||
|
name: "deploy-test",
|
||||||
|
command: [
|
||||||
|
"python",
|
||||||
|
"deploy_test.py",
|
||||||
|
"--params=" + std.join(",", [
|
||||||
|
"name=mnist-test-" + prowDict["BUILD_ID"],
|
||||||
|
"namespace=" + testNamespace,
|
||||||
|
"modelBasePath=" + modelDir + "/export",
|
||||||
|
"exportDir=" + modelDir,
|
||||||
|
])],
|
||||||
|
workingDir: srcDir + "/mnist/testing",
|
||||||
|
},
|
||||||
|
dependencies: ["tfjob-test"],
|
||||||
|
}, // deploy-test
|
||||||
// TODO(jlewi): We should add a non-distributed test that just uses the default values.
|
// TODO(jlewi): We should add a non-distributed test that just uses the default values.
|
||||||
];
|
];
|
||||||
|
|
||||||
|
|
@ -277,8 +341,35 @@ local dag = {
|
||||||
|
|
||||||
// Define templates for the steps to be performed when the
|
// Define templates for the steps to be performed when the
|
||||||
// test exits
|
// test exits
|
||||||
|
|
||||||
|
local deleteTemplates = if params.deleteNamespace then
|
||||||
|
[
|
||||||
|
{
|
||||||
|
// Delete the namespace
|
||||||
|
// TODO(jlewi): We should add some sort of retry.
|
||||||
|
template: buildTemplate {
|
||||||
|
name: "delete-namespace",
|
||||||
|
command: util.buildCommand([
|
||||||
|
[
|
||||||
|
"gcloud",
|
||||||
|
"auth",
|
||||||
|
"activate-service-account",
|
||||||
|
"--key-file=${GOOGLE_APPLICATION_CREDENTIALS}",
|
||||||
|
],
|
||||||
|
[
|
||||||
|
"kubectl",
|
||||||
|
"delete",
|
||||||
|
"namespace",
|
||||||
|
testNamespace,
|
||||||
|
]]
|
||||||
|
),
|
||||||
|
},
|
||||||
|
}, // delete-namespace
|
||||||
|
] else [];
|
||||||
|
|
||||||
local exitTemplates =
|
local exitTemplates =
|
||||||
[
|
deleteTemplates +
|
||||||
|
[
|
||||||
{
|
{
|
||||||
// Copy artifacts to GCS for gubernator.
|
// Copy artifacts to GCS for gubernator.
|
||||||
// TODO(https://github.com/kubeflow/testing/issues/257): Create-pr-symlink
|
// TODO(https://github.com/kubeflow/testing/issues/257): Create-pr-symlink
|
||||||
|
|
@ -294,7 +385,6 @@ local exitTemplates =
|
||||||
"--bucket=" + bucket,
|
"--bucket=" + bucket,
|
||||||
],
|
],
|
||||||
}, // copy-artifacts,
|
}, // copy-artifacts,
|
||||||
|
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
// Delete the test directory in NFS.
|
// Delete the test directory in NFS.
|
||||||
|
|
@ -314,7 +404,7 @@ local exitTemplates =
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
}, // test-dir-delete
|
}, // test-dir-delete
|
||||||
dependencies: ["copy-artifacts"],
|
dependencies: ["copy-artifacts"] + if params.deleteNamespace then ["delete-namespace"] else [],
|
||||||
},
|
},
|
||||||
];
|
];
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -14,8 +14,8 @@ local envParams = params + {
|
||||||
},
|
},
|
||||||
mnist+: {
|
mnist+: {
|
||||||
namespace: 'kubeflow-test-infra',
|
namespace: 'kubeflow-test-infra',
|
||||||
name: 'jlewi-mnist-test-465-0109-050605',
|
name: 'jlewi-mnist-test-469-0111-081531',
|
||||||
prow_env: 'JOB_NAME=mnist-test,JOB_TYPE=presubmit,REPO_NAME=examples,REPO_OWNER=kubeflow,BUILD_NUMBER=0109-050605,BUILD_ID=0109-050605,PULL_NUMBER=465',
|
prow_env: 'JOB_NAME=mnist-test,JOB_TYPE=presubmit,REPO_NAME=examples,REPO_OWNER=kubeflow,BUILD_NUMBER=0111-081531,BUILD_ID=0111-081531,PULL_NUMBER=469',
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
};
|
};
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue