|
10 | 10 | | triton.command | list | `["/bin/sh","-c"]` | Command and arguments to run in Triton container | |
11 | 11 | | triton.args[0] | string | `"/opt/tritonserver/bin/tritonserver \\\n--model-repository=/tmp/ \\\n--log-verbose=0 \\\n--exit-timeout-secs=60\n"` | | |
12 | 12 | | triton.resources | object | `{"limits":{"cpu":1,"memory":"2G"},"requests":{"cpu":1,"memory":"2G"}}` | Resource limits and requests for each Triton instance. You can add the necessary GPU requests here. | |
| 13 | +| triton.annotations | object | `{}` | Annotations for Triton pods | |
| 14 | +| triton.nodeSelector | object | `{}` | Node selector for Triton pods | |
| 15 | +| triton.tolerations | list | `[]` | Tolerations for Triton pods | |
13 | 16 | | triton.affinity | object | `{}` | Affinity rules for Triton pods - another way to request GPUs | |
14 | 17 | | triton.modelRepository | object | `{"enabled":false,"mountPath":""}` | Model repository configuration | |
15 | 18 | | triton.modelRepository.mountPath | string | `""` | Model repository mount path | |
|
25 | 28 | | envoy.image | string | `"envoyproxy/envoy:v1.30.9"` | Envoy Proxy Docker image | |
26 | 29 | | envoy.args | list | `["--config-path","/etc/envoy/envoy.yaml","--log-level","info","--log-path","/dev/stdout"]` | Arguments for Envoy | |
27 | 30 | | envoy.resources | object | `{"limits":{"cpu":8,"memory":"4G"},"requests":{"cpu":1,"memory":"2G"}}` | Resource requests and limits for Envoy Proxy. Note: an Envoy Proxy with too many connections might run out of CPU | |
| 31 | +| envoy.annotations | object | `{}` | Annotations for Envoy pods | |
| 32 | +| envoy.nodeSelector | object | `{}` | Node selector for Envoy pods | |
| 33 | +| envoy.tolerations | list | `[]` | Tolerations for Envoy pods | |
28 | 34 | | envoy.service.type | string | `"ClusterIP"` | This is the client-facing endpoint. To connect to it, either enable ingress or use `type: LoadBalancer`. | |
29 | 35 | | envoy.service.ports | list | `[{"name":"grpc","port":8001,"targetPort":8001},{"name":"admin","port":9901,"targetPort":9901}]` | Envoy Service ports | |
30 | 36 | | envoy.ingress | object | `{"annotations":{},"enabled":false,"hostName":"","ingressClassName":""}` | Ingress configuration for Envoy | |
|
54 | 60 | | autoscaler.scaleDown.stabilizationWindowSeconds | int | `600` | | |
55 | 61 | | autoscaler.scaleDown.periodSeconds | int | `120` | | |
56 | 62 | | autoscaler.scaleDown.stepsize | int | `1` | | |
57 | | -| nodeSelector | object | `{}` | Node selector for all pods (Triton and Envoy) | |
58 | | -| tolerations | list | `[]` | Tolerations for all pods (Triton and Envoy) | |
59 | 63 | | prometheus.external.enabled | bool | `false` | Enable external Prometheus instance. If true, Prometheus parameters outside of prometheus.external will be ignored. | |
60 | 64 | | prometheus.external.url | string | `""` | External Prometheus server URL | |
61 | 65 | | prometheus.external.port | int | `443` | External Prometheus server port number | |
|
0 commit comments