From e61671d16b9f1d964a1344207444af74eec0ca94 Mon Sep 17 00:00:00 2001 From: jeffluoo Date: Mon, 24 Feb 2025 20:11:01 +0000 Subject: [PATCH] docs: add example for inference extension Hold until https://github.com/GoogleCloudPlatform/monitoring-dashboard-samples/pull/929 is submitted and public page is generated. --- examples/inference-extension/README.md | 3 ++ .../inference-extension/pod-monitoring.yaml | 30 +++++++++++++++++++ 2 files changed, 33 insertions(+) create mode 100644 examples/inference-extension/README.md create mode 100644 examples/inference-extension/pod-monitoring.yaml diff --git a/examples/inference-extension/README.md b/examples/inference-extension/README.md new file mode 100644 index 0000000000..5f080be106 --- /dev/null +++ b/examples/inference-extension/README.md @@ -0,0 +1,3 @@ +# Inference Extension sample manifests + +Please refer to the [Google Cloud documentation](https://cloud.google.com/stackdriver/docs/managed-prometheus/exporters/inference-extension) for how to use these manifests. diff --git a/examples/inference-extension/pod-monitoring.yaml b/examples/inference-extension/pod-monitoring.yaml new file mode 100644 index 0000000000..a135b67653 --- /dev/null +++ b/examples/inference-extension/pod-monitoring.yaml @@ -0,0 +1,30 @@ +# Copyright 2025 Google LLC +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# https://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+
+apiVersion: monitoring.googleapis.com/v1
+kind: PodMonitoring
+metadata:
+  name: inference-extension
+  labels:
+    app.kubernetes.io/part-of: google-cloud-managed-prometheus
+    app.kubernetes.io/name: inference-gateway
+spec:
+  selector:  # scrape only pods carrying the label below
+    matchLabels:
+      app: inference-gateway-ext-proc
+  endpoints:
+    - port: metrics  # port referenced by name, not by number
+      path: /metrics
+      scheme: http
+      interval: 5s  # scrape period for this endpoint