diff --git a/docs/admin/code-hosts/aws-codecommit.mdx b/docs/admin/code-hosts/aws-codecommit.mdx
index 45bb54f32..0e68adef1 100644
--- a/docs/admin/code-hosts/aws-codecommit.mdx
+++ b/docs/admin/code-hosts/aws-codecommit.mdx
@@ -37,7 +37,7 @@ AWS CodeCommit connections support the following configuration options, which ar
{/* SCHEMA_SYNC_START: admin/code_hosts/aws_codecommit.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// REQUIRED:
diff --git a/docs/admin/code-hosts/azuredevops.mdx b/docs/admin/code-hosts/azuredevops.mdx
index 08f4c56e2..3e2b37db0 100644
--- a/docs/admin/code-hosts/azuredevops.mdx
+++ b/docs/admin/code-hosts/azuredevops.mdx
@@ -65,7 +65,7 @@ Azure DevOps connections support the following configuration options, which are
{/* SCHEMA_SYNC_START: admin/code_hosts/azuredevops.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
// Authentication alternatives: token OR windowsPassword
diff --git a/docs/admin/code-hosts/bitbucket-cloud.mdx b/docs/admin/code-hosts/bitbucket-cloud.mdx
index 8349f8ef6..2b62143cc 100644
--- a/docs/admin/code-hosts/bitbucket-cloud.mdx
+++ b/docs/admin/code-hosts/bitbucket-cloud.mdx
@@ -116,7 +116,7 @@ Bitbucket Cloud connections support the following configuration options, which a
{/* SCHEMA_SYNC_START: admin/code_hosts/bitbucket_cloud.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// The workspace access token to use when authenticating with Bitbucket Cloud.
diff --git a/docs/admin/code-hosts/bitbucket-server.mdx b/docs/admin/code-hosts/bitbucket-server.mdx
index 01f1bd272..035e6b4ce 100644
--- a/docs/admin/code-hosts/bitbucket-server.mdx
+++ b/docs/admin/code-hosts/bitbucket-server.mdx
@@ -202,7 +202,7 @@ Bitbucket Server / Bitbucket Data Center connections support the following confi
{/* SCHEMA_SYNC_START: admin/code_hosts/bitbucket_server.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
// Authentication alternatives: token OR password
diff --git a/docs/admin/code-hosts/gerrit.mdx b/docs/admin/code-hosts/gerrit.mdx
index 651b5093a..25db5a4ef 100644
--- a/docs/admin/code-hosts/gerrit.mdx
+++ b/docs/admin/code-hosts/gerrit.mdx
@@ -113,7 +113,7 @@ Gerrit connections support the following configuration options, which are specif
{/* SCHEMA_SYNC_START: admin/code_hosts/gerrit.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// If non-null, enforces Gerrit repository permissions. This requires that there is an item in the [site configuration json](https://sourcegraph.com/docs/admin/config/site_config#auth-providers) `auth.providers` field, of type "gerrit" with the same `url` field as specified in this `GerritConnection`.
diff --git a/docs/admin/code-hosts/github.mdx b/docs/admin/code-hosts/github.mdx
index 777eedc88..e461ad3a3 100644
--- a/docs/admin/code-hosts/github.mdx
+++ b/docs/admin/code-hosts/github.mdx
@@ -454,7 +454,7 @@ GitHub connections support the following configuration options, which are specif
{/* SCHEMA_SYNC_START: admin/code_hosts/github.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
// Authentication alternatives: token OR gitHubAppDetails OR externalAccount OR useRandomExternalAccount
diff --git a/docs/admin/code-hosts/gitlab.mdx b/docs/admin/code-hosts/gitlab.mdx
index e125d1fee..e331cee12 100644
--- a/docs/admin/code-hosts/gitlab.mdx
+++ b/docs/admin/code-hosts/gitlab.mdx
@@ -189,7 +189,7 @@ See [Internal rate limits](/admin/code-hosts/rate-limits#internal-rate-limits).
{/* SCHEMA_SYNC_START: admin/code_hosts/gitlab.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// If non-null, enforces GitLab repository permissions. This requires that there be an item in the `auth.providers` field of type "gitlab" with the same `url` field as specified in this `GitLabConnection`.
diff --git a/docs/admin/code-hosts/gitolite.mdx b/docs/admin/code-hosts/gitolite.mdx
index d085e26ed..c9d61a59f 100644
--- a/docs/admin/code-hosts/gitolite.mdx
+++ b/docs/admin/code-hosts/gitolite.mdx
@@ -25,7 +25,7 @@ To connect Gitolite to Sourcegraph:
{/* SCHEMA_SYNC_START: admin/code_hosts/gitolite.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// A list of repositories to never mirror from this Gitolite instance. Supports excluding by exact name ({"name": "foo"}).
diff --git a/docs/admin/code-hosts/other.mdx b/docs/admin/code-hosts/other.mdx
index cb0ee85c5..bf95ea9b6 100644
--- a/docs/admin/code-hosts/other.mdx
+++ b/docs/admin/code-hosts/other.mdx
@@ -68,7 +68,7 @@ Repositories must be listed individually:
{/* SCHEMA_SYNC_START: admin/code_hosts/other_external_service.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// A list of repositories to never mirror by name after applying repositoryPathPattern. Supports excluding by exact name ({"name": "myrepo"}) or regular expression ({"pattern": ".*secret.*"}).
diff --git a/docs/admin/code-hosts/phabricator.mdx b/docs/admin/code-hosts/phabricator.mdx
index 5e05fdfaa..f2c50a6dd 100644
--- a/docs/admin/code-hosts/phabricator.mdx
+++ b/docs/admin/code-hosts/phabricator.mdx
@@ -76,7 +76,7 @@ The Sourcegraph instance's site admin must [update the `corsOrigin` site config
{/* SCHEMA_SYNC_START: admin/code_hosts/phabricator.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// SSH cipher to use when cloning via SSH. Must be a valid choice from `ssh -Q cipher`.
diff --git a/docs/admin/config/settings.mdx b/docs/admin/config/settings.mdx
index b0347f255..181d46e5d 100644
--- a/docs/admin/config/settings.mdx
+++ b/docs/admin/config/settings.mdx
@@ -27,7 +27,7 @@ Settings options and their default values are shown below.
{/* SCHEMA_SYNC_START: admin/config/settings.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
diff --git a/docs/admin/config/site-config.mdx b/docs/admin/config/site-config.mdx
index 36d8d9fe5..0750f3a89 100644
--- a/docs/admin/config/site-config.mdx
+++ b/docs/admin/config/site-config.mdx
@@ -21,7 +21,7 @@ All site configuration options and their default values are shown below.
{/* SCHEMA_SYNC_START: admin/config/site.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
@@ -448,6 +448,9 @@ All site configuration options and their default values are shown below.
// DEPRECATED: Configure maxRepos in search.limits
"maxReposToSearch": -1,
+ // Enable/disable MCP API endpoints under `/.api/mcp`. When disabled, MCP endpoints return 404.
+ "mcp.enabled": true,
+
"modelConfiguration": null,
// Notifications received from Sourcegraph.com to display in Sourcegraph.
@@ -648,7 +651,7 @@ All site configuration options and their default values are shown below.
  "tls.external": null,
-  // The channel on which to automatically check for Sourcegraph updates.
+  // ⚠️ DEPRECATED: This setting has no effect.
// Valid options: "release", "none"
// Other example values:
// - "none"
@@ -737,7 +741,7 @@ All site configuration options and their default values are shown below.
// When enabled, users are required to connect at least one external account to their Sourcegraph account. Site admins are exempt from this requirement.
"auth.enforceExternalAccountConnection": false,
- // Enables OAuth 2.0 Dynamic Client Registration (RFC 7591) for the Sourcegraph identity provider. When enabled, OAuth clients can self-register programmatically instead of requiring manual pre-configuration. Required for MCP clients and other applications that use dynamic registration for authorization.
+ // Enables OAuth 2.0 Dynamic Client Registration (RFC 7591) for the Sourcegraph identity provider. When enabled, OAuth clients can self-register programmatically instead of requiring manual pre-configuration. This is used for MCP clients; if `mcp.enabled` is `false`, this setting is treated as `false`.
"auth.idpDynamicClientRegistrationEnabled": true,
// The config options for account lockout
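
For illustration, a minimal site configuration fragment exercising the two settings changed above — the keys come from the schema in this diff, while the values are example choices rather than defaults:

```json
{
  // Turn off the MCP endpoints under `/.api/mcp`; requests to them return 404.
  "mcp.enabled": false,

  // Dynamic client registration is only used for MCP clients, so with
  // "mcp.enabled": false this value is treated as false regardless of
  // what is configured here.
  "auth.idpDynamicClientRegistrationEnabled": true
}
```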
diff --git a/docs/admin/repo/perforce.mdx b/docs/admin/repo/perforce.mdx
index 55a6d31e4..524089737 100644
--- a/docs/admin/repo/perforce.mdx
+++ b/docs/admin/repo/perforce.mdx
@@ -228,7 +228,7 @@ With this setting, Sourcegraph will ignore any rules with a host other than `*`,
{/* SCHEMA_SYNC_START: admin/code_hosts/perforce.schema.json */}
{/* WARNING: This section is auto-generated during releases. Do not edit manually. */}
-{/* Last updated: 2026-03-06T20:59:17Z */}
+{/* Last updated: 2026-03-27T11:45:04Z */}
```json
{
// If non-null, enforces Perforce depot permissions.
diff --git a/docs/admin/telemetry/private-metadata-allowlist.mdx b/docs/admin/telemetry/private-metadata-allowlist.mdx
index a887e247f..609fe90f9 100644
--- a/docs/admin/telemetry/private-metadata-allowlist.mdx
+++ b/docs/admin/telemetry/private-metadata-allowlist.mdx
@@ -33,4 +33,5 @@ To learn more, refer to the [telemetry documentation](https://sourcegraph.com/do
| `cody.modelSelector` | _(all)_ | `modelId` — High-cardinality model identifier; helpful for determining the model selected in the model selector.
`modelProvider` — High-cardinality model provider; helpful for determining the model selected in the model selector. |
| `cody.smart-apply.context` | `applied` | `model` — High-cardinality model identifier; helpful for determining the model that was selected. |
| `deepsearch` | `search.toolcall` | `toolName` — High-cardinality tool name; helpful for determining which tools are being used during deep search.
`toolId` — High-cardinality tool identifier; helpful for determining which tools are being used during deep search.
`model` — High-cardinality model identifier; helpful for determining which models are being used during deep search. |
+| `admin.users` | `delete` | `userIDs` — Numeric identifiers of users being deleted; needed for audit and analytics of admin user management actions. |
| `externalApi` | `request` | `procedure` — ConnectRPC procedure path (e.g. '/sourcegraph.users.v1.UsersService/GetUser'); not sensitive and needed to distinguish which external API RPCs are being used. |
\ No newline at end of file
diff --git a/docs/cli/references/index.mdx b/docs/cli/references/index.mdx
index c511872ba..5f606371d 100644
--- a/docs/cli/references/index.mdx
+++ b/docs/cli/references/index.mdx
@@ -15,11 +15,11 @@
* [`lsp`](references/lsp)
* [`orgs`](references/orgs)
* [`repos`](references/repos)
-* [`sbom` (deprecated)](references/sbom)
+* [`sbom`](references/sbom)
* [`search`](references/search)
* [`search-jobs`](references/search-jobs)
* [`serve-git`](references/serve-git)
-* [`signature` (deprecated)](references/signature)
+* [`signature`](references/signature)
* [`snapshot`](references/snapshot)
* [`teams`](references/teams)
* [`users`](references/users)
diff --git a/docs/cli/references/sbom.mdx b/docs/cli/references/sbom.mdx
index e3750cf6a..76dd910b3 100644
--- a/docs/cli/references/sbom.mdx
+++ b/docs/cli/references/sbom.mdx
@@ -1,13 +1,11 @@
# `src sbom`
-
diff --git a/docs/self-hosted/observability/alerts.mdx b/docs/self-hosted/observability/alerts.mdx
--- a/docs/self-hosted/observability/alerts.mdx
+++ b/docs/self-hosted/observability/alerts.mdx
+## frontend: goroutine_error_percentage_long_window
+
+percentage of failed periodic goroutine executions over a long window
+
+**Descriptions**
+
+- warning frontend: 30%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s
+- critical frontend: 50%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s
+
+**Next steps**
+
+- Check service logs for error details related to the failing periodic routine
+- Check if the routine depends on external services that may be unavailable
+- Consider temporarily disabling the routine if it's non-critical and causing cascading issues
+- More help interpreting this metric is available in the [dashboards reference](dashboards#frontend-goroutine_error_percentage_long_window).
+- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
+
+```json
+"observability.silenceAlerts": [
+  "warning_frontend_goroutine_error_percentage_long_window",
+  "critical_frontend_goroutine_error_percentage_long_window"
+]
+```
+
+*Managed by the Sourcegraph Services team.*
+
 mean blocked seconds per conn request
@@ -1386,37 +1423,6 @@ Generated query for critical alert: `min(((src_gitserver_disk_space_available /
-container CPU throttling time %
-
-**Descriptions**
-
-- warning gitserver: 75%+ container CPU throttling time % for 2m0s
-
-**Next steps**
-
-- Consider increasing the CPU limit for the container.
-- More help interpreting this metric is available in the [dashboards reference](dashboards#gitserver-cpu_throttling_time).
-- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
-
-```json
-"observability.silenceAlerts": [
-  "warning_gitserver_cpu_throttling_time"
-]
-```
-
-*Managed by the Sourcegraph Services team.*
-
 echo test command duration
@@ -1513,6 +1519,99 @@ Generated query for warning alert: `max((sum(src_gitserver_clone_queue)) >= 2
+## gitserver: cpu_usage_percentage
+
+CPU usage
+
+**Descriptions**
+
+- warning gitserver: 95%+ CPU usage for 10m0s
+
+**Next steps**
+
+- Consider increasing CPU limits or scaling out.
+- Learn more about the related dashboard panel in the [dashboards reference](dashboards#gitserver-cpu_usage_percentage).
+- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
+
+```json
+"observability.silenceAlerts": [
+  "warning_gitserver_cpu_usage_percentage"
+]
+```
+
+*Managed by the Sourcegraph Services team.*
+
+## gitserver: memory_rss
+
+memory (RSS)
+
+**Descriptions**
+
+- warning gitserver: 90%+ memory (RSS) for 10m0s
+
+**Next steps**
+
+- Consider increasing memory limits or scaling out.
+- More help interpreting this metric is available in the [dashboards reference](dashboards#gitserver-memory_rss).
+- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
+
+```json
+"observability.silenceAlerts": [
+  "warning_gitserver_memory_rss"
+]
+```
+
+*Managed by the Sourcegraph Services team.*
+
+## gitserver: cpu_throttling_time
+
+container CPU throttling time %
+
+**Descriptions**
+
+- warning gitserver: 75%+ container CPU throttling time % for 2m0s
+
+**Next steps**
+
+- Consider increasing the CPU limit for the container.
+- More help interpreting this metric is available in the [dashboards reference](dashboards#gitserver-cpu_throttling_time).
+- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
+
+```json
+"observability.silenceAlerts": [
+  "warning_gitserver_cpu_throttling_time"
+]
+```
+
+*Managed by the Sourcegraph Services team.*
+
 rate of git command corruption retry attempts over 5m
@@ -1613,23 +1712,27 @@ Generated query for warning alert: `max((sum by (name, job_name) (rate(src_perio
-CPU usage
+percentage of failed periodic goroutine executions over a long window

 **Descriptions**

-- warning gitserver: 95%+ CPU usage for 10m0s
+- warning gitserver: 30%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s
+- critical gitserver: 50%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s

 **Next steps**

-- Consider increasing CPU limits or scaling out.
-- Learn more about the related dashboard panel in the [dashboards reference](dashboards#gitserver-cpu_usage_percentage).
+- Check service logs for error details related to the failing periodic routine
+- Check if the routine depends on external services that may be unavailable
+- Consider temporarily disabling the routine if it's non-critical and causing cascading issues
+- More help interpreting this metric is available in the [dashboards reference](dashboards#gitserver-goroutine_error_percentage_long_window).
 - **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:

 ```json
 "observability.silenceAlerts": [
-  "warning_gitserver_cpu_usage_percentage"
+  "warning_gitserver_goroutine_error_percentage_long_window",
+  "critical_gitserver_goroutine_error_percentage_long_window"
 ]
 ```

@@ -1638,38 +1741,9 @@ Generated query for warning alert: `max((sum by (name, job_name) (rate(src_perio
-memory (RSS)
-
-**Descriptions**
-
-- warning gitserver: 90%+ memory (RSS) for 10m0s
-
-**Next steps**
-
-- Consider increasing memory limits or scaling out.
-- More help interpreting this metric is available in the [dashboards reference](dashboards#gitserver-memory_rss).
-- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
-
-```json
-"observability.silenceAlerts": [
-  "warning_gitserver_memory_rss"
-]
-```
-
-*Managed by the Sourcegraph Services team.*
-
+Generated query for warning alert: `max(((sum by (name, job_name) (increase(src_periodic_goroutine_errors_total{job=~".*gitserver.*"}[6h])) / clamp_min(sum by (name, job_name) (increase(src_periodic_goroutine_total{job=~".*gitserver.*"}[6h])), 1)) * 100) >= 30)`
+## worker: goroutine_error_percentage_long_window
+
+percentage of failed periodic goroutine executions over a long window
+
+**Descriptions**
+
+- warning worker: 30%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s
+- critical worker: 50%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s
+
+**Next steps**
+
+- Check service logs for error details related to the failing periodic routine
+- Check if the routine depends on external services that may be unavailable
+- Consider temporarily disabling the routine if it's non-critical and causing cascading issues
+- More help interpreting this metric is available in the [dashboards reference](dashboards#worker-goroutine_error_percentage_long_window).
+- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
+
+```json
+"observability.silenceAlerts": [
+  "warning_worker_goroutine_error_percentage_long_window",
+  "critical_worker_goroutine_error_percentage_long_window"
+]
+```
+
+*Managed by the Sourcegraph Services team.*
+
 mean blocked seconds per conn request
@@ -4488,6 +4599,43 @@ Generated query for warning alert: `max((sum by (name, job_name) (rate(src_perio
+## searcher: goroutine_error_percentage_long_window
+
+percentage of failed periodic goroutine executions over a long window
+
+**Descriptions**
+
+- warning searcher: 30%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s
+- critical searcher: 50%+ percentage of failed periodic goroutine executions over a long window for 3h0m0s
+
+**Next steps**
+
+- Check service logs for error details related to the failing periodic routine
+- Check if the routine depends on external services that may be unavailable
+- Consider temporarily disabling the routine if it's non-critical and causing cascading issues
+- More help interpreting this metric is available in the [dashboards reference](dashboards#searcher-goroutine_error_percentage_long_window).
+- **Silence this alert:** If you are aware of this alert and want to silence notifications for it, add the following to your site configuration and set a reminder to re-evaluate the alert:
+
+```json
+"observability.silenceAlerts": [
+  "warning_searcher_goroutine_error_percentage_long_window",
+  "critical_searcher_goroutine_error_percentage_long_window"
+]
+```
+
+*Managed by the Sourcegraph Services team.*
+
 mean blocked seconds per conn request
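
If you need to silence all of the new long-window goroutine alerts at once while a fix is investigated, the keys introduced above can be combined into a single list — a sketch using only the alert names that appear in this diff:

```json
"observability.silenceAlerts": [
  "warning_frontend_goroutine_error_percentage_long_window",
  "critical_frontend_goroutine_error_percentage_long_window",
  "warning_gitserver_goroutine_error_percentage_long_window",
  "critical_gitserver_goroutine_error_percentage_long_window",
  "warning_worker_goroutine_error_percentage_long_window",
  "critical_worker_goroutine_error_percentage_long_window",
  "warning_searcher_goroutine_error_percentage_long_window",
  "critical_searcher_goroutine_error_percentage_long_window"
]
```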
diff --git a/docs/self-hosted/observability/dashboards.mdx b/docs/self-hosted/observability/dashboards.mdx
index dce0c86d8..c31f05a89 100644
--- a/docs/self-hosted/observability/dashboards.mdx
+++ b/docs/self-hosted/observability/dashboards.mdx
@@ -4539,6 +4539,32 @@ sum by (name, job_name) (rate(src_periodic_goroutine_errors_total{job=~".*fronte
+#### frontend: goroutine_error_percentage_long_window
+
+Percentage of failed periodic goroutine executions over a long window
+
+The percentage of failed executions over the last 6 hours for each periodic goroutine.
+A value above 30% sustained for at least 3 hours indicates persistent failures.
+A value above 50% sustained for at least 3 hours indicates that most executions are failing continuously.
+
+Refer to the [alerts reference](alerts#frontend-goroutine_error_percentage_long_window) for 2 alerts related to this panel.
+
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102920` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
 95th percentile handler execution time
@@ -4548,7 +4574,7 @@ Longer durations might indicate increased load or processing time.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102920` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102930` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4573,7 +4599,7 @@ This represents how long a complete loop iteration takes before sleeping for the

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102921` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102931` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4598,7 +4624,7 @@ Higher values indicate that tenant processing is taking longer and may affect ov

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102930` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102940` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4623,7 +4649,7 @@ Consistently high values might indicate problematic tenants or inefficient proce

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102931` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102941` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4648,7 +4674,7 @@ Unexpected changes can indicate tenant configuration issues or scaling events.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102940` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102950` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4673,7 +4699,7 @@ A healthy routine should maintain a consistent processing rate.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102941` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102951` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4698,7 +4724,7 @@ Consistent errors indicate problems with specific tenants.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102950` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102960` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4723,7 +4749,7 @@ Values above 5% indicate significant tenant processing problems.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102951` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/frontend/frontend?viewPanel=102961` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -4993,7 +5019,7 @@ max by (name) (container_memory_working_set_bytes{name=~"^(frontend|sourcegraph-
 Memory (RSS)

-The total anonymous memory in use by the application, which includes Go stack and heap. This memory is is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS because to match the cadvisor name, but `anonymous` is more accurate."
+The total anonymous memory in use by the application, which includes Go stack and heap. This memory is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS to match the cadvisor name, but "anonymous" is more accurate.

 Refer to the [alerts reference](alerts#frontend-memory_rss) for 1 alert related to this panel.

@@ -6025,66 +6051,22 @@ Query:
-Container CPU throttling time %
-
-- A high value indicates that the container is spending too much time waiting for CPU cycles.
-
-Refer to the [alerts reference](alerts#gitserver-cpu_throttling_time) for 1 alert related to this panel.
-
-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100010` on your Sourcegraph instance.
-
-*Managed by the Sourcegraph Services team.*
-
-Cpu usage seconds
-
-- This value should not exceed 75% of the CPU limit over a longer period of time.
-- We cannot alert on this as we don`t know the resource allocation.
-- If this value is high for a longer time, consider increasing the CPU limit for the container.
-
-This panel has no related alerts.
-
-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100011` on your Sourcegraph instance.
-
-*Managed by the Sourcegraph Services team.*
-
-#### gitserver: memory_major_page_faults
-
-Gitserver page faults
-
-The number of major page faults in a 5 minute window for gitserver. If this number increases significantly, it indicates that more git API calls need to load data from disk. There may not be enough memory to efficiently support the amount of API requests served concurrently.
+Number of git commands that exceeded the threshold for high memory usage
+
+This graph tracks the number of git subcommands that gitserver ran that exceeded the threshold for high memory usage.
+This graph in itself is not an alert, but it is used to learn about the memory usage of gitserver.
+
+If gitserver frequently serves requests where the status code is KILLED, this graph might help to correlate that
+with the high memory usage.
+
+This graph spiking is not a problem necessarily. But when subcommands or the whole gitserver service are getting
+OOM killed and this graph shows spikes, increasing the memory might be useful.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100020` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100010` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6094,28 +6076,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10002

 Query:

 ```
-rate(container_memory_failures_total{failure_type="pgmajfault", name=~"^gitserver.*"}[5m])
+sort_desc(sum(sum_over_time(src_gitserver_exec_high_memory_usage_count{instance=~`${shard:regex}`}[2m])) by (cmd))
 ```

-Number of git commands that exceeded the threshold for high memory usage
-
-This graph tracks the number of git subcommands that gitserver ran that exceeded the threshold for high memory usage.
-This graph in itself is not an alert, but it is used to learn about the memory usage of gitserver.
-
-If gitserver frequently serves requests where the status code is KILLED, this graph might help to correlate that
-with the high memory usage.
-
-This graph spiking is not a problem necessarily. But when subcommands or the whole gitserver service are getting
-OOM killed and this graph shows spikes, increasing the memory might be useful.
+#### gitserver: running_git_commands
+
+Git commands running on each gitserver instance
+
+A high value signals load.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100021` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100011` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6125,21 +6100,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10002

 Query:

 ```
-sort_desc(sum(sum_over_time(src_gitserver_exec_high_memory_usage_count{instance=~`${shard:regex}`}[2m])) by (cmd))
+sum by (instance, cmd) (src_gitserver_exec_running{instance=~`${shard:regex}`})
 ```

-A high value signals load.
+Rate of git commands received
+
+per second rate per command

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100030` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100012` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6149,21 +6124,22 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10003

 Query:

 ```
-sum by (instance, cmd) (src_gitserver_exec_running{instance=~`${shard:regex}`})
+sum by (cmd) (rate(src_gitserver_exec_duration_seconds_count{instance=~`${shard:regex}`}[5m]))
 ```

-per second rate per command
+Git command CPU usage seconds by requester scope
+
+CPU time consumed by git subcommands, grouped by propagated requester scope and CPU kind.
+Use this to identify high-CPU callers and whether time is spent in user or system CPU.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100031` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100013` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6173,7 +6149,7 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10003

 Query:

 ```
-sum by (cmd) (rate(src_gitserver_exec_duration_seconds_count{instance=~`${shard:regex}`}[5m]))
+topk(20, sum by (scope, kind) (rate(src_gitserver_exec_cpu_seconds_total{instance=~`${shard:regex}`}[5m])))
 ```

@@ -6187,7 +6163,7 @@ sum by (cmd) (rate(src_gitserver_exec_duration_seconds_count{instance=~`${shard:

 Refer to the [alerts reference](alerts#gitserver-echo_command_duration_test) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100040` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100020` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6213,7 +6189,7 @@ by recloning repositories, but this may take a while depending on repo size.

 Refer to the [alerts reference](alerts#gitserver-repo_corrupted) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100041` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100021` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6235,7 +6211,7 @@ sum(rate(src_gitserver_repo_corrupted[5m]))

 Refer to the [alerts reference](alerts#gitserver-repository_clone_queue_size) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100050` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100030` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6261,7 +6237,7 @@ It does not indicate any problems with the instance, but can give a good indicat

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100051` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100031` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6277,15 +6253,26 @@ sum by (job, instance) (src_gitserver_client_concurrent_requests)
-95th percentile gitservice request duration per shard
+A trend to watch out for: when something in-application happens to take a lot of memory, and active file previously used nearly all remaining memory, then:
-
-A high value means any internal service trying to clone a repo from gitserver is slowed down.
+
+1. 'Memory (RSS)' goes up, due to in-application usage
+2. 'Memory usage (Active file)' goes down, as file data held in memory is evicted
+3. 'Page faults' go up, as less data is held in memory (and with that, IOPS, disk read throughput, ...)
-
-This panel has no related alerts.
+
+This can also happen without 'Memory (RSS)' increasing, if the provisioned memory is insufficient to start with.
+A small degree of this behaviour is generally expected, but if it happens significantly or causes user-noticeable impact, it's likely gitserver could benefit from more memory. Look for more user-facing metrics to make a final determination on appropriate resource allocation.
+
+_See https://en.wikipedia.org/wiki/Memory-mapped_file and the related articles for more information about memory maps._
+
+#### gitserver: cpu_usage_percentage
+
+CPU usage
+
+Refer to the [alerts reference](alerts#gitserver-cpu_usage_percentage) for 1 alert related to this panel.

 To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100100` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6297,17 +6284,17 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10010

 Query:

 ```
-histogram_quantile(0.95, sum(rate(src_gitserver_gitservice_duration_seconds_bucket{instance=~`${shard:regex}`}[5m])) by (le, gitservice))
+cadvisor_container_cpu_usage_percentage_total{name=~"^gitserver.*"}
 ```

-Gitservice request rate per shard
-
-Per shard gitservice request rate
+Memory usage percentage (total)
+
+An estimate for the active memory in use, which includes anonymous memory, file memory, and kernel memory. Some of this memory is reclaimable, so high usage does not necessarily indicate memory pressure.

 This panel has no related alerts.

@@ -6321,17 +6308,17 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10010

 Query:

 ```
-sum(rate(src_gitserver_gitservice_duration_seconds_count{instance=~`${shard:regex}`}[5m])) by (gitservice)
+cadvisor_container_memory_usage_percentage_total{name=~"^gitserver.*"}
 ```

-Gitservice requests running per shard
-
-Per shard gitservice requests running
+Memory usage bytes (total)
+
+An estimate for the active memory in use in bytes, which includes anonymous memory, file memory, and kernel memory. Some of this memory is reclaimable, so high usage does not necessarily indicate memory pressure.

 This panel has no related alerts.

@@ -6345,23 +6332,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10010

 Query:

 ```
-sum(src_gitserver_gitservice_running{instance=~`${shard:regex}`}) by (gitservice)
+max by (name) (container_memory_working_set_bytes{name=~"^gitserver.*"})
 ```

-Total housekeeping tasks by type and status
-
-The rate of housekeeping tasks performed in repositories, broken down by task type and success/failure status
+Memory (RSS)
+
+The total anonymous memory in use by the application, which includes Go stack and heap. This memory is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS to match the cadvisor name, but "anonymous" is more accurate.

-This panel has no related alerts.
+Refer to the [alerts reference](alerts#gitserver-memory_rss) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100200` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100110` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6371,21 +6356,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10020

 Query:

 ```
-sum(rate(src_gitserver_janitor_tasks_total{instance=~`${shard:regex}`}[5m])) by (housekeeping_task, status)
+max(container_memory_rss{name=~"^gitserver.*"} / container_spec_memory_limit_bytes{name=~"^gitserver.*"}) by (name) * 100.0
 ```

-90th percentile latency of successful tasks by type over 5m
-
-The 90th percentile latency of successful housekeeping tasks, broken down by task type
+Memory usage (active file)
+
+This metric shows the total active file-backed memory currently in use by the application. Some of it may be reclaimable, so high usage does not necessarily indicate memory pressure.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100210` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100111` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6395,21 +6380,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10021

 Query:

 ```
-histogram_quantile(0.90, sum(rate(src_gitserver_janitor_tasks_latency_bucket{instance=~`${shard:regex}`, status="success"}[5m])) by (le, housekeeping_task))
+max(container_memory_total_active_file_bytes{name=~"^gitserver.*"} / container_spec_memory_limit_bytes{name=~"^gitserver.*"}) by (name) * 100.0
 ```

-95th percentile latency of successful tasks by type over 5m
-
-The 95th percentile latency of successful housekeeping tasks, broken down by task type
+Memory usage (kernel)
+
+The kernel usage metric shows the amount of memory used by the kernel on behalf of the application. Some of it may be reclaimable, so high usage does not necessarily indicate memory pressure.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100211` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100112` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6419,21 +6404,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10021

 Query:

 ```
-histogram_quantile(0.95, sum(rate(src_gitserver_janitor_tasks_latency_bucket{instance=~`${shard:regex}`, status="success"}[5m])) by (le, housekeeping_task))
+max(container_memory_kernel_usage{name=~"^gitserver.*"} / container_spec_memory_limit_bytes{name=~"^gitserver.*"}) by (name) * 100.0
 ```

-99th percentile latency of successful tasks by type over 5m
-
-The 99th percentile latency of successful housekeeping tasks, broken down by task type
+Gitserver page faults
+
+The number of major page faults in a 5 minute window for gitserver. If this number increases significantly, it indicates that more git API calls need to load data from disk. There may not be enough memory to efficiently support the amount of API requests served concurrently.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100212` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100120` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6443,21 +6428,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10021

 Query:

 ```
-histogram_quantile(0.99, sum(rate(src_gitserver_janitor_tasks_latency_bucket{instance=~`${shard:regex}`, status="success"}[5m])) by (le, housekeeping_task))
+rate(container_memory_failures_total{failure_type="pgmajfault", name=~"^gitserver.*"}[5m])
 ```

-90th percentile latency of failed tasks by type over 5m
-
-The 90th percentile latency of failed housekeeping tasks, broken down by task type
+Container CPU throttling time %
+
+A high value indicates that the container is spending too much time waiting for CPU cycles.

-This panel has no related alerts.
+Refer to the [alerts reference](alerts#gitserver-cpu_throttling_time) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100220` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100130` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6467,21 +6452,23 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10022

 Query:

 ```
-histogram_quantile(0.90, sum(rate(src_gitserver_janitor_tasks_latency_bucket{instance=~`${shard:regex}`, status="failure"}[5m])) by (le, housekeeping_task))
+sum by (container_label_io_kubernetes_pod_name) ((rate(container_cpu_cfs_throttled_periods_total{container_label_io_kubernetes_container_name="gitserver", container_label_io_kubernetes_pod_name=~`${shard:regex}`}[5m]) / rate(container_cpu_cfs_periods_total{container_label_io_kubernetes_container_name="gitserver", container_label_io_kubernetes_pod_name=~`${shard:regex}`}[5m])) * 100)
 ```

-95th percentile latency of failed tasks by type over 5m
-
-The 95th percentile latency of failed housekeeping tasks, broken down by task type
+Cpu usage seconds
+
+- This value should not exceed 75% of the CPU limit over a longer period of time.
+- We cannot alert on this as we don't know the resource allocation.
+- If this value is high for a longer time, consider increasing the CPU limit for the container.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100221` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100131` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6491,21 +6478,23 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10022

 Query:

 ```
-histogram_quantile(0.95, sum(rate(src_gitserver_janitor_tasks_latency_bucket{instance=~`${shard:regex}`, status="failure"}[5m])) by (le, housekeeping_task))
+sum by (container_label_io_kubernetes_pod_name) (rate(container_cpu_usage_seconds_total{container_label_io_kubernetes_container_name="gitserver", container_label_io_kubernetes_pod_name=~`${shard:regex}`}[5m]))
 ```

-99th percentile latency of failed tasks by type over 5m
+#### gitserver: gitservice_request_duration
+
-
-The 99th percentile latency of failed housekeeping tasks, broken down by task type
+95th percentile gitservice request duration per shard
+
+A high value means any internal service trying to clone a repo from gitserver is slowed down.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100222` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100200` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6515,21 +6504,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10022

 Query:

 ```
-histogram_quantile(0.99, sum(rate(src_gitserver_janitor_tasks_latency_bucket{instance=~`${shard:regex}`, status="failure"}[5m])) by (le, housekeeping_task))
+histogram_quantile(0.95, sum(rate(src_gitserver_gitservice_duration_seconds_bucket{instance=~`${shard:regex}`}[5m])) by (le, gitservice))
 ```

-Files pruned by type over 5m
-
-The rate of files pruned during cleanup, broken down by file type
+Gitservice request rate per shard
+
+Per shard gitservice request rate

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100230` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100201` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6539,21 +6528,21 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10023

 Query:

 ```
-sum(rate(src_gitserver_janitor_pruned_files_total{instance=~`${shard:regex}`}[5m])) by (filetype)
+sum(rate(src_gitserver_gitservice_duration_seconds_count{instance=~`${shard:regex}`}[5m])) by (gitservice)
 ```

-Data structure counts over 5m
-
-The count distribution of various Git data structures in repositories
+Gitservice requests running per shard
+
+Per shard gitservice requests running

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100240` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100202` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6563,21 +6552,23 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10024

 Query:

 ```
-histogram_quantile(0.95, sum(rate(src_gitserver_janitor_data_structure_count_bucket{instance=~`${shard:regex}`}[5m])) by (le, data_structure))
+sum(src_gitserver_gitservice_running{instance=~`${shard:regex}`}) by (gitservice)
 ```

+#### gitserver: janitor_tasks_total
+
-Data structure sizes
-
-The size distribution of various Git data structures in repositories
+Total housekeeping tasks by type and status
+
+The rate of housekeeping tasks performed in repositories, broken down by task type and success/failure status

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100250` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100300` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6587,21 +6578,237 @@ To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=10025

 Query:

 ```
-histogram_quantile(0.95, sum(rate(src_gitserver_janitor_data_structure_size_bucket{instance=~`${shard:regex}`}[5m])) by (le, data_structure))
+sum(rate(src_gitserver_janitor_tasks_total{instance=~`${shard:regex}`}[5m])) by (housekeeping_task, status)
 ```

-Time since last optimization
-
-The time elapsed since last optimization of various Git data structures
+90th percentile latency of successful tasks by type over 5m
+
+The 90th percentile latency of successful housekeeping tasks, broken down by task type
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100310` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+95th percentile latency of successful tasks by type over 5m
+
+The 95th percentile latency of successful housekeeping tasks, broken down by task type
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100311` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+99th percentile latency of successful tasks by type over 5m
+
+The 99th percentile latency of successful housekeeping tasks, broken down by task type
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100312` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+90th percentile latency of failed tasks by type over 5m
+
+The 90th percentile latency of failed housekeeping tasks, broken down by task type
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100320` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+95th percentile latency of failed tasks by type over 5m
+
+The 95th percentile latency of failed housekeeping tasks, broken down by task type
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100321` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+99th percentile latency of failed tasks by type over 5m
+
+The 99th percentile latency of failed housekeeping tasks, broken down by task type
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100322` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+Files pruned by type over 5m
+
+The rate of files pruned during cleanup, broken down by file type
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100330` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+Data structure counts over 5m
+
+The count distribution of various Git data structures in repositories
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100340` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+Data structure sizes
+
+The size distribution of various Git data structures in repositories
+
+This panel has no related alerts.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100350` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
+Time since last optimization
+
+The time elapsed since last optimization of various Git data structures

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100260` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100360` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6625,7 +6832,7 @@ The rate at which data structures are reported to exist in repositories

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100270` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100370` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6653,7 +6860,7 @@ This metric helps track how often the retry mechanism is triggered.

 Refer to the [alerts reference](alerts#gitserver-git_command_retry_attempts_rate) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100300` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100400` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6678,7 +6885,7 @@ This indicates how effective the retry mechanism is at resolving transient corru

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100301` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100401` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6703,7 +6910,7 @@ These failures will result in repository corruption marking and potential reclon

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100310` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100410` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6729,7 +6936,7 @@ Common causes include network issues, permission changes, or concurrent reposito

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100311` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100411` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6755,7 +6962,7 @@ A low ratio may indicate persistent corruption issues requiring investigation.

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100312` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100412` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6782,7 +6989,7 @@ A value of 0 indicates the routine isn`t running currently, it awaits it`s next

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100400` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100500` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -6807,7 +7014,7 @@ A low or zero value could indicate that a routine is stalled or encountering err

 This panel has no related alerts.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100401` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100501` on your Sourcegraph instance.

 *Managed by the Sourcegraph Platform team.*

@@ -6832,7 +7039,7 @@ A sustained high error rate may indicate a problem with the routine`s configurat

 Refer to the [alerts reference](alerts#gitserver-goroutine_error_rate) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100410` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100510` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6857,7 +7064,7 @@ A value above 5% indicates that a significant portion of routine executions are

 Refer to the [alerts reference](alerts#gitserver-goroutine_error_percentage) for 1 alert related to this panel.

-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100411` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100511` on your Sourcegraph instance.

 *Managed by the Sourcegraph Services team.*

@@ -6873,6 +7080,32 @@ sum by (name, job_name) (rate(src_periodic_goroutine_errors_total{job=~".*gitser
+#### gitserver: goroutine_error_percentage_long_window
+
+Percentage of failed periodic goroutine executions over a long window
+
+The percentage of failed executions over the last 6 hours for each periodic goroutine.
+A value above 30% sustained for at least 3 hours indicates persistent failures.
+A value above 50% sustained for at least 3 hours indicates that most executions are failing continuously.
+
+Refer to the [alerts reference](alerts#gitserver-goroutine_error_percentage_long_window) for 2 alerts related to this panel.
+
+To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100520` on your Sourcegraph instance.
+
+*Managed by the Sourcegraph Services team.*
+
 95th percentile handler execution time
@@ -6882,7 +7115,7 @@ Longer durations might indicate increased load or processing time. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100420` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100530` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -6907,7 +7140,7 @@ This represents how long a complete loop iteration takes before sleeping for the This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100421` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100531` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -6932,7 +7165,7 @@ Higher values indicate that tenant processing is taking longer and may affect ov This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100430` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100540` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -6957,7 +7190,7 @@ Consistently high values might indicate problematic tenants or inefficient proce This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100431` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100541` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -6982,7 +7215,7 @@ Unexpected changes can indicate tenant configuration issues or scaling events. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100440` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100550` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -7007,7 +7240,7 @@ A healthy routine should maintain a consistent processing rate. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100441` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100551` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -7032,7 +7265,7 @@ Consistent errors indicate problems with specific tenants. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100450` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100560` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -7057,7 +7290,7 @@ Values above 5% indicate significant tenant processing problems. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100451` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100561` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -7073,159 +7306,15 @@ Query:CPU usage
+Transmission rate over 5m (aggregate)
-Refer to the [alerts reference](alerts#gitserver-cpu_usage_percentage) for 1 alert related to this panel.
+The rate of bytes sent over the network across all pods.
-To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100500` on your Sourcegraph instance.
-
-*Managed by the Sourcegraph Services team.*
-
-Memory usage percentage (total)

- -An estimate for the active memory in use, which includes anonymous memory, file memory, and kernel memory. Some of this memory is reclaimable, so high usage does not necessarily indicate memory pressure. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100501` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Memory usage bytes (total)
- -An estimate for the active memory in use in bytes, which includes anonymous memory, file memory, and kernel memory. Some of this memory is reclaimable, so high usage does not necessarily indicate memory pressure. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100502` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Memory (RSS)
- -The total anonymous memory in use by the application, which includes Go stack and heap. This memory is is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS because to match the cadvisor name, but `anonymous` is more accurate." - -Refer to the [alerts reference](alerts#gitserver-memory_rss) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100510` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Memory usage (active file)
- -This metric shows the total active file-backed memory currently in use by the application. Some of it may be reclaimable, so high usage does not necessarily indicate memory pressure. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100511` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Memory usage (kernel)
- -The kernel usage metric shows the amount of memory used by the kernel on behalf of the application. Some of it may be reclaimable, so high usage does not necessarily indicate memory pressure. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100512` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Transmission rate over 5m (aggregate)
- -The rate of bytes sent over the network across all pods - -This panel has no related alerts. +This panel has no related alerts. To see this panel, visit `/-/debug/grafana/d/gitserver/gitserver?viewPanel=100600` on your Sourcegraph instance. @@ -17130,6 +17219,32 @@ sum by (name, job_name) (rate(src_periodic_goroutine_errors_total{job=~".*workerPercentage of failed periodic goroutine executions over a long window
+ +The percentage of failed executions over the last 6 hours for each periodic goroutine. +A value above 30% sustained for at least 3 hours indicates persistent failures. +A value above 50% sustained for at least 3 hours indicates that most executions are failing continuously. + +Refer to the [alerts reference](alerts#worker-goroutine_error_percentage_long_window) for 2 alerts related to this panel. + +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101820` on your Sourcegraph instance. + +*Managed by the Sourcegraph Services team.* + +95th percentile handler execution time
@@ -17139,7 +17254,7 @@ Longer durations might indicate increased load or processing time. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101820` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101830` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17164,7 +17279,7 @@ This represents how long a complete loop iteration takes before sleeping for the This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101821` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101831` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17189,7 +17304,7 @@ Higher values indicate that tenant processing is taking longer and may affect ov This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101830` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101840` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17214,7 +17329,7 @@ Consistently high values might indicate problematic tenants or inefficient proce This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101831` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101841` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17239,7 +17354,7 @@ Unexpected changes can indicate tenant configuration issues or scaling events. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101840` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101850` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17264,7 +17379,7 @@ A healthy routine should maintain a consistent processing rate. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101841` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101851` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17289,7 +17404,7 @@ Consistent errors indicate problems with specific tenants. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101850` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101860` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17314,7 +17429,7 @@ Values above 5% indicate significant tenant processing problems. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101851` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/worker/worker?viewPanel=101861` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -17584,7 +17699,7 @@ max by (name) (container_memory_working_set_bytes{name=~"^worker.*"})Memory (RSS)
-The total anonymous memory in use by the application, which includes Go stack and heap. This memory is is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS because to match the cadvisor name, but `anonymous` is more accurate." +The total anonymous memory in use by the application, which includes Go stack and heap. This memory is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS to match the cadvisor name, but "anonymous" is more accurate. Refer to the [alerts reference](alerts#worker-memory_rss) for 1 alert related to this panel. @@ -20833,6 +20948,32 @@ sum by (name, job_name) (rate(src_periodic_goroutine_errors_total{job=~".*searchPercentage of failed periodic goroutine executions over a long window
+ +The percentage of failed executions over the last 6 hours for each periodic goroutine. +A value above 30% sustained for at least 3 hours indicates persistent failures. +A value above 50% sustained for at least 3 hours indicates that most executions are failing continuously. + +Refer to the [alerts reference](alerts#searcher-goroutine_error_percentage_long_window) for 2 alerts related to this panel. + +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101420` on your Sourcegraph instance. + +*Managed by the Sourcegraph Services team.* + +95th percentile handler execution time
@@ -20842,7 +20983,7 @@ Longer durations might indicate increased load or processing time. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101420` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101430` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -20867,7 +21008,7 @@ This represents how long a complete loop iteration takes before sleeping for the This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101421` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101431` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -20892,7 +21033,7 @@ Higher values indicate that tenant processing is taking longer and may affect ov This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101430` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101440` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -20917,7 +21058,7 @@ Consistently high values might indicate problematic tenants or inefficient proce This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101431` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101441` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -20942,7 +21083,7 @@ Unexpected changes can indicate tenant configuration issues or scaling events. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101440` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101450` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -20967,7 +21108,7 @@ A healthy routine should maintain a consistent processing rate. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101441` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101451` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -20992,7 +21133,7 @@ Consistent errors indicate problems with specific tenants. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101450` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101460` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -21017,7 +21158,7 @@ Values above 5% indicate significant tenant processing problems. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101451` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/searcher/searcher?viewPanel=101461` on your Sourcegraph instance. *Managed by the Sourcegraph Platform team.* @@ -21287,7 +21428,7 @@ max by (name) (container_memory_working_set_bytes{name=~"^searcher.*"})Memory (RSS)
-The total anonymous memory in use by the application, which includes Go stack and heap. This memory is is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS because to match the cadvisor name, but `anonymous` is more accurate." +The total anonymous memory in use by the application, which includes Go stack and heap. This memory is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS to match the cadvisor name, but "anonymous" is more accurate. Refer to the [alerts reference](alerts#searcher-memory_rss) for 1 alert related to this panel. @@ -21815,7 +21956,7 @@ max by (name) (container_memory_working_set_bytes{name=~"^syntect-server.*"})Memory (RSS)
-The total anonymous memory in use by the application, which includes Go stack and heap. This memory is is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS because to match the cadvisor name, but `anonymous` is more accurate." +The total anonymous memory in use by the application, which includes Go stack and heap. This memory is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS to match the cadvisor name, but "anonymous" is more accurate. Refer to the [alerts reference](alerts#syntect-server-memory_rss) for 1 alert related to this panel. @@ -22369,7 +22510,7 @@ max by (name) (container_memory_working_set_bytes{name=~"^zoekt-indexserver.*"})Memory (RSS)
-The total anonymous memory in use by the application, which includes Go stack and heap. This memory is is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS because to match the cadvisor name, but `anonymous` is more accurate."
+The total anonymous memory in use by the application, which includes Go stack and heap. This memory is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS to match the cadvisor name, but "anonymous" is more accurate.

Refer to the [alerts reference](alerts#zoekt-memory_rss) for 1 alert related to this panel.

@@ -22439,6 +22580,19 @@ max(container_memory_kernel_usage{name=~"^zoekt-indexserver.*"} / container_spec

### Zoekt: Zoekt-webserver (CPU, Memory)

+Zoekt web server leverages memory mapping to optimize file reads: it is generally expected to consume all the memory provided to it, if it can. When it finds data that is not available in memory yet, this causes a 'page fault', and the data is loaded into memory from disk.
+
+A trend to watch out for: when something in-application happens to take a lot of memory, and active file previously used nearly all remaining memory, then:
+
+1. 'Memory (RSS)' goes up, due to in-application usage
+2. 'Memory usage (Active file)' goes down, as file data held in memory is evicted
+3. 'Page faults' go up, as less data is held in memory (and with that, IOPS, disk read throughput, ...)
+
+This can also happen without 'Memory (RSS)' increasing, if the provisioned memory is insufficient to start with.
+A small degree of this behaviour is generally expected, but if it happens significantly or causes user-noticeable impact, it's likely zoekt web server could benefit from more memory. Look for more user-facing metrics to make a final determination on appropriate resource allocation.
+
+_See https://en.wikipedia.org/wiki/Memory-mapped_file and the related articles for more information about memory maps._
+
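+As a rough way to watch for this pattern, a PromQL sketch along these lines can track major page faults (hypothetical: the `container_memory_failures_total` metric and its `failure_type` label follow standard cAdvisor naming and are not taken from this dashboard):
+
+```promql
+# Sketch only: major page faults per second across zoekt-webserver containers.
+# A sustained rise alongside falling active-file memory suggests the eviction
+# pattern described above.
+sum by (name) (rate(container_memory_failures_total{name=~"^zoekt-webserver.*", failure_type="pgmajfault"}[5m]))
+```
+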
 #### zoekt: cpu_usage_percentage

CPU usage


@@ -22513,7 +22667,7 @@ max by (name) (container_memory_working_set_bytes{name=~"^zoekt-webserver.*"})

Memory (RSS)

-The total anonymous memory in use by the application, which includes Go stack and heap. This memory is is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS because to match the cadvisor name, but `anonymous` is more accurate." +The total anonymous memory in use by the application, which includes Go stack and heap. This memory is non-reclaimable, and high usage may trigger OOM kills. Note: the metric is named RSS to match the cadvisor name, but "anonymous" is more accurate. Refer to the [alerts reference](alerts#zoekt-memory_rss) for 1 alert related to this panel. @@ -31886,1547 +32040,7 @@ This panel has no related alerts. To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101011` on your Sourcegraph instance. -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation errors every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101012` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation error rate over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101013` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records scanned every 5m
- -The number of candidate records considered for cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101100` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records altered every 5m
- -The number of candidate records altered as part of cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101101` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operations every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101110` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -99th percentile successful job invocation operation duration over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101111` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation errors every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101112` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation error rate over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101113` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records scanned every 5m
- -The number of candidate records considered for cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101200` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records altered every 5m
- -The number of candidate records altered as part of cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101201` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operations every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101210` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -99th percentile successful job invocation operation duration over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101211` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation errors every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101212` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation error rate over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101213` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records scanned every 5m
- -The number of candidate records considered for cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101300` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records altered every 5m
- -The number of candidate records altered as part of cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101301` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operations every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101310` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -99th percentile successful job invocation operation duration over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101311` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation errors every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101312` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation error rate over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101313` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records scanned every 5m
- -The number of candidate records considered for cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101400` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Records altered every 5m
- -The number of candidate records altered as part of cleanup. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101401` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operations every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101410` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -99th percentile successful job invocation operation duration over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101411` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation errors every 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101412` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Job invocation operation error rate over 5m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101413` on your Sourcegraph instance. - -*Managed by the Sourcegraph Code Understanding team.* - -Monitoring telemetry services in Sourcegraph.
- -To see this dashboard, visit `/-/debug/grafana/d/telemetry/telemetry` on your Sourcegraph instance. - -### Telemetry: Telemetry Gateway Exporter: Events export and queue metrics - -#### telemetry: telemetry_gateway_exporter_queue_size - -Telemetry event payloads pending export
- -The number of events queued to be exported. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100000` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Rate of growth of events export queue over 30m
- -A positive value indicates the queue is growing. - -Refer to the [alerts reference](alerts#telemetry-telemetry_gateway_exporter_queue_growth) for 2 alerts related to this panel. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100001` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events exported from queue per hour
- -The number of events being exported. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100010` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Number of events exported per batch over 30m
- -The number of events exported in each batch. The largest bucket is the maximum number of events exported per batch. -If the distribution trends to the maximum bucket, then events export throughput is at or approaching saturation - try increasing `TELEMETRY_GATEWAY_EXPORTER_EXPORT_BATCH_SIZE` or decreasing `TELEMETRY_GATEWAY_EXPORTER_EXPORT_INTERVAL`. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100011` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events exporter operations every 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100100` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Aggregate successful events exporter operation duration distribution over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100101` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events exporter operation errors every 30m
- -Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_exporter_errors_total) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100102` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events exporter operation error rate over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100103` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events export queue cleanup operations every 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100200` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Aggregate successful events export queue cleanup operation duration distribution over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100201` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events export queue cleanup operation errors every 30m
- -Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_queue_cleanup_errors_total) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100202` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events export queue cleanup operation error rate over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100203` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events export backlog metrics reporting operations every 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100300` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Aggregate successful events export backlog metrics reporting operation duration distribution over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100301` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events export backlog metrics reporting operation errors every 30m
- -Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_queue_metrics_reporter_errors_total) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100302` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Events export backlog metrics reporting operation error rate over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100303` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Failed writes to events export queue over 5m
- -Telemetry V2 writes send events into the `telemetry_events_export_queue` for the exporter to periodically export. - -Refer to the [alerts reference](alerts#telemetry-telemetry_v2_export_queue_write_failures) for 2 alerts related to this panel. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100400` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Failed write V2 events to V1 'event_logs' over 5m
- -Telemetry V2 writes also attempt to `tee` events into the legacy V1 events format in the `event_logs` database table for long-term local persistence. - -Refer to the [alerts reference](alerts#telemetry-telemetry_v2_event_logs_write_failures) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100401` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -(off by default) user metadata exporter operations every 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100500` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -Aggregate successful (off by default) user metadata exporter operation duration distribution over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100501` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -(off by default) user metadata exporter operation errors every 30m
- -Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_usermetadata_exporter_errors_total) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100502` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -(off by default) user metadata exporter operation error rate over 30m
- -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100503` on your Sourcegraph instance. - -*Managed by the Sourcegraph Services team.* - -The OpenTelemetry collector ingests OpenTelemetry data from Sourcegraph and exports it to the configured backends.
- -To see this dashboard, visit `/-/debug/grafana/d/otel-collector/otel-collector` on your Sourcegraph instance. - -### OpenTelemetry Collector: Receivers - -#### otel-collector: otel_span_receive_rate - -Spans received per receiver per minute
- -Shows the rate of spans accepted by the configured reveiver - -A Trace is a collection of spans and a span represents a unit of work or operation. Spans are the building blocks of Traces. -The spans have only been accepted by the receiver, which means they still have to move through the configured pipeline to be exported. -For more information on tracing and configuration of a OpenTelemetry receiver see https://opentelemetry.io/docs/collector/configuration/#receivers. - -See the Exporters section see spans that have made it through the pipeline and are exported. - -Depending the configured processors, received spans might be dropped and not exported. For more information on configuring processors see -https://opentelemetry.io/docs/collector/configuration/#processors. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100000` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Spans refused per receiver
- - - -Refer to the [alerts reference](alerts#otel-collector-otel_span_refused) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100001` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Spans exported per exporter per minute
- -Shows the rate of spans being sent by the exporter - -A Trace is a collection of spans. A Span represents a unit of work or operation. Spans are the building blocks of Traces. -The rate of spans here indicates spans that have made it through the configured pipeline and have been sent to the configured export destination. - -For more information on configuring a exporter for the OpenTelemetry collector see https://opentelemetry.io/docs/collector/configuration/#exporters. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100100` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Span export failures by exporter
- -Shows the rate of spans failed to be sent by the configured reveiver. A number higher than 0 for a long period can indicate a problem with the exporter configuration or with the service that is being exported too - -For more information on configuring a exporter for the OpenTelemetry collector see https://opentelemetry.io/docs/collector/configuration/#exporters. - -Refer to the [alerts reference](alerts#otel-collector-otel_span_export_failures) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100101` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Exporter queue capacity
- -Shows the the capacity of the retry queue (in batches). - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100200` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Exporter queue size
- -Shows the current size of retry queue - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100201` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Exporter enqueue failed spans
- -Shows the rate of spans failed to be enqueued by the configured exporter. A number higher than 0 for a long period can indicate a problem with the exporter configuration - -Refer to the [alerts reference](alerts#otel-collector-otelcol_exporter_enqueue_failed_spans) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100202` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Spans dropped per processor per minute
- -Shows the rate of spans dropped by the configured processor - -Refer to the [alerts reference](alerts#otel-collector-otelcol_processor_dropped_spans) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100300` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Cpu usage of the collector
- -Shows CPU usage as reported by the OpenTelemetry collector. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100400` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Memory allocated to the otel collector
- -Shows the allocated memory Resident Set Size (RSS) as reported by the OpenTelemetry collector. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100401` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Memory used by the collector
- -Shows how much memory is being used by the otel collector. - -* High memory usage might indicate thad the configured pipeline is keeping a lot of spans in memory for processing -* Spans failing to be sent and the exporter is configured to retry -* A high batch count by using a batch processor - -For more information on configuring processors for the OpenTelemetry collector see https://opentelemetry.io/docs/collector/configuration/#processors. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100402` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Container missing
- -This value is the number of times a container has not been seen for more than one minute. If you observe this -value change independent of deployment events (such as an upgrade), it could indicate pods are being OOM killed or terminated for some other reasons. - -- **Kubernetes:** - - Determine if the pod was OOM killed using `kubectl describe pod otel-collector` (look for `OOMKilled: true`) and, if so, consider increasing the memory limit in the relevant `Deployment.yaml`. - - Check the logs before the container restarted to see if there are `panic:` messages or similar using `kubectl logs -p otel-collector`. -- **Docker Compose:** - - Determine if the pod was OOM killed using `docker inspect -f '\{\{json .State\}\}' otel-collector` (look for `"OOMKilled":true`) and, if so, consider increasing the memory limit of the otel-collector container in `docker-compose.yml`. - - Check the logs before the container restarted to see if there are `panic:` messages or similar using `docker logs otel-collector` (note this will include logs from the previous and currently running container). - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100500` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Container cpu usage total (1m average) across all cores by instance
- -Refer to the [alerts reference](alerts#otel-collector-container_cpu_usage) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100501` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Container memory usage by instance
- -Refer to the [alerts reference](alerts#otel-collector-container_memory_usage) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100502` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Filesystem reads and writes rate by instance over 1h
- -This value indicates the number of filesystem read and write operations by containers of this service. -When extremely high, this can indicate a resource usage problem, or can cause problems with the service itself, especially if high values or spikes correlate with \{\{CONTAINER_NAME\}\} issues. - -This panel has no related alerts. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100503` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* - -Percentage pods available
- -Refer to the [alerts reference](alerts#otel-collector-pods_available_percentage) for 1 alert related to this panel. - -To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100600` on your Sourcegraph instance. - -*Managed by the Sourcegraph Platform team.* +*Managed by the Sourcegraph Code Understanding team.*Cody chat and code completions.
- -To see this dashboard, visit `/-/debug/grafana/d/completions/completions` on your Sourcegraph instance. - -### Completions: Completions requests - -#### completions: api_request_rate - -Rate of completions API requests
+#### codeintel-uploads: codeintel_uploads_hard_deleter_errors_total -Rate (QPS) of requests to cody chat and code completion endpoints. +Job invocation operation errors every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100000` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101012` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: total time (p99)
+#### codeintel-uploads: codeintel_uploads_hard_deleter_error_rate -Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming. +Job invocation operation error rate over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100100` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101013` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: total time (p95)
+Records scanned every 5m
-Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming. +The number of candidate records considered for cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100101` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101100` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: total time (p75)
+Records altered every 5m
-Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming. +The number of candidate records altered as part of cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100102` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101101` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: total time (p50)
+#### codeintel-uploads: codeintel_uploads_janitor_audit_logs_total -Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming. +Job invocation operations every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100103` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101110` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Non-stream overhead (p99)
+#### codeintel-uploads: codeintel_uploads_janitor_audit_logs_99th_percentile_duration -Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc. +99th percentile successful job invocation operation duration over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100110` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101111` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Non-stream overhead (p95)
+#### codeintel-uploads: codeintel_uploads_janitor_audit_logs_errors_total -Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc. +Job invocation operation errors every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100111` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101112` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Non-stream overhead (p75)
+#### codeintel-uploads: codeintel_uploads_janitor_audit_logs_error_rate -Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc. +Job invocation operation error rate over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100112` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101113` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Non-stream overhead (p50)
+Records scanned every 5m
-Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc. +The number of candidate records considered for cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100113` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101200` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: time to first event (p99)
+Records altered every 5m
-Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back. +The number of candidate records altered as part of cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100120` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101201` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: time to first event (p95)
+#### codeintel-uploads: codeintel_uploads_janitor_scip_documents_total -Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back. +Job invocation operations every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100121` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101210` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: time to first event (p75)
+#### codeintel-uploads: codeintel_uploads_janitor_scip_documents_99th_percentile_duration -Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back. +99th percentile successful job invocation operation duration over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100122` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101211` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: time to first event (p50)
+#### codeintel-uploads: codeintel_uploads_janitor_scip_documents_errors_total -Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back. +Job invocation operation errors every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100123` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101212` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: first byte sent -> received (p99)
+#### codeintel-uploads: codeintel_uploads_janitor_scip_documents_error_rate -Time between sending the first byte to the upstream, and then getting the first byte back from the upstream. +Job invocation operation error rate over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100130` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101213` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: first byte sent -> received (p95)
+Records scanned every 5m
-Time between sending the first byte to the upstream, and then getting the first byte back from the upstream. +The number of candidate records considered for cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100131` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101300` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: first byte sent -> received (p75)
+Records altered every 5m
-Time between sending the first byte to the upstream, and then getting the first byte back from the upstream. +The number of candidate records altered as part of cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100132` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101301` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: first byte sent -> received (p50)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_metadata_total -Time between sending the first byte to the upstream, and then getting the first byte back from the upstream. +Job invocation operations every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100133` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101310` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: total (p99)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_metadata_99th_percentile_duration -Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc. +99th percentile successful job invocation operation duration over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100140` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101311` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: total (p95)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_metadata_errors_total -Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc. +Job invocation operation errors every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100141` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101312` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: total (p75)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_metadata_error_rate -Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc. +Job invocation operation error rate over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100142` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101313` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: total (p50)
+Records scanned every 5m
-Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc. +The number of candidate records considered for cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100143` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101400` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: dns (p99)
+Records altered every 5m
-Portion of time spent on DNS when acquiring an HTTP connection to the upstream. +The number of candidate records altered as part of cleanup. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100150` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101401` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: dns (p95)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_data_total -Portion of time spent on DNS when acquiring an HTTP connection to the upstream. +Job invocation operations every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100151` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101410` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: dns (p75)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_data_99th_percentile_duration -Portion of time spent on DNS when acquiring an HTTP connection to the upstream. +99th percentile successful job invocation operation duration over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100152` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101411` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: dns (p50)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_data_errors_total -Portion of time spent on DNS when acquiring an HTTP connection to the upstream. +Job invocation operation errors every 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100153` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101412` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Stream: HTTP connect: tls (p99)
+#### codeintel-uploads: codeintel_uploads_reconciler_scip_data_error_rate -Portion of time spent on TLS when acquiring an HTTP connection to the upstream. +Job invocation operation error rate over 5m
This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100160` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/codeintel-uploads/codeintel-uploads?viewPanel=101413` on your Sourcegraph instance. +*Managed by the Sourcegraph Code Understanding team.*Monitoring telemetry services in Sourcegraph.
+ +To see this dashboard, visit `/-/debug/grafana/d/telemetry/telemetry` on your Sourcegraph instance. + +### Telemetry: Telemetry Gateway Exporter: Events export and queue metrics + +#### telemetry: telemetry_gateway_exporter_queue_size -Stream: HTTP connect: tls (p95)
+Telemetry event payloads pending export
-Portion of time spent on TLS when acquiring an HTTP connection to the upstream. +The number of events queued to be exported. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100161` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100000` on your Sourcegraph instance. +*Managed by the Sourcegraph Services team.*Stream: HTTP connect: tls (p75)
+Rate of growth of events export queue over 30m
-Portion of time spent on TLS when acquiring an HTTP connection to the upstream. +A positive value indicates the queue is growing. -This panel has no related alerts. +Refer to the [alerts reference](alerts#telemetry-telemetry_gateway_exporter_queue_growth) for 2 alerts related to this panel. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100162` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100001` on your Sourcegraph instance. +*Managed by the Sourcegraph Services team.*Stream: HTTP connect: tls (p50)
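+
+For the queue-growth panel above, the intent can be sketched as follows (hypothetical: the `src_telemetrygatewayexporter_queue_size` gauge name is an assumption, not taken from this page):
+
+```promql
+# Sketch only: positive values mean the export queue grew over the trailing 30m.
+max(delta(src_telemetrygatewayexporter_queue_size[30m]))
+```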
+Events exported from queue per hour
-Portion of time spent on TLS when acquiring an HTTP connection to the upstream. +The number of events being exported. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100163` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100010` on your Sourcegraph instance. +*Managed by the Sourcegraph Services team.*Stream: HTTP connect: dial (p99)
+Number of events exported per batch over 30m
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream. +The number of events exported in each batch. The largest bucket is the maximum number of events exported per batch. +If the distribution trends to the maximum bucket, then events export throughput is at or approaching saturation - try increasing `TELEMETRY_GATEWAY_EXPORTER_EXPORT_BATCH_SIZE` or decreasing `TELEMETRY_GATEWAY_EXPORTER_EXPORT_INTERVAL`. This panel has no related alerts. -To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100170` on your Sourcegraph instance. +To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100011` on your Sourcegraph instance. +*Managed by the Sourcegraph Services team.*Stream: HTTP connect: dial (p95)
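+
+As a minimal tuning sketch (not shipped configuration): this assumes the exporter runs in the `worker` deployment and uses illustrative values, so adjust the deployment name, namespace, and numbers to your environment.
+
+```bash
+# Raise the per-batch event limit and shorten the export interval on the
+# (assumed) worker deployment, then wait for the change to roll out:
+kubectl set env deployment/worker \
+  TELEMETRY_GATEWAY_EXPORTER_EXPORT_BATCH_SIZE=1000 \
+  TELEMETRY_GATEWAY_EXPORTER_EXPORT_INTERVAL=5m
+kubectl rollout status deployment/worker
+```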
-Stream: HTTP connect: dial (p95)
+#### telemetry: telemetrygatewayexporter_exporter_total
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream.
+Events exporter operations every 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100171` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100100` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: HTTP connect: dial (p75)
+#### telemetry: telemetrygatewayexporter_exporter_99th_percentile_duration
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream.
+Aggregate successful events exporter operation duration distribution over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100172` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100101` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: HTTP connect: dial (p50)
+#### telemetry: telemetrygatewayexporter_exporter_errors_total
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream.
+Events exporter operation errors every 30m
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_exporter_errors_total) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100173` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100102` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: total time (p99)
+#### telemetry: telemetrygatewayexporter_exporter_error_rate
-Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming.
+Events exporter operation error rate over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100200` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100103` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: total time (p95)
+#### telemetry: telemetrygatewayexporter_queue_cleanup_total
-Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming.
+Events export queue cleanup operations every 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100201` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100200` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: total time (p75)
+#### telemetry: telemetrygatewayexporter_queue_cleanup_99th_percentile_duration
-Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming.
+Aggregate successful events export queue cleanup operation duration distribution over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100202` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100201` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: total time (p50)
+#### telemetry: telemetrygatewayexporter_queue_cleanup_errors_total
-Time spent on the Stream() invocation, i.e. how long results take to connect, stream results, and finish streaming.
+Events export queue cleanup operation errors every 30m
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_queue_cleanup_errors_total) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100203` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100202` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Non-stream overhead (p99)
+#### telemetry: telemetrygatewayexporter_queue_cleanup_error_rate
-Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc.
+Events export queue cleanup operation error rate over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100210` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100203` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Non-stream overhead (p95)
+#### telemetry: telemetrygatewayexporter_queue_metrics_reporter_total
-Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc.
+Events export backlog metrics reporting operations every 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100211` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100300` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Non-stream overhead (p75)
+#### telemetry: telemetrygatewayexporter_queue_metrics_reporter_99th_percentile_duration
-Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc.
+Aggregate successful events export backlog metrics reporting operation duration distribution over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100212` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100301` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Non-stream overhead (p50)
+#### telemetry: telemetrygatewayexporter_queue_metrics_reporter_errors_total
-Time between Go HTTP handler invocation and Stream() invocation, overhead of e.g. request validation, routing to gateway/other, model resolution, error reporting/tracing, guardrails, etc.
+Events export backlog metrics reporting operation errors every 30m
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_queue_metrics_reporter_errors_total) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100213` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100302` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: time to first event (p99)
+#### telemetry: telemetrygatewayexporter_queue_metrics_reporter_error_rate
-Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back.
+Events export backlog metrics reporting operation error rate over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100220` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100303` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: time to first event (p95)
+#### telemetry: telemetry_v2_export_queue_write_failures
-Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back.
+Failed writes to events export queue over 5m
-This panel has no related alerts.
+Telemetry V2 writes send events into the `telemetry_events_export_queue` for the exporter to periodically export.
+
+Refer to the [alerts reference](alerts#telemetry-telemetry_v2_export_queue_write_failures) for 2 alerts related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100221` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100400` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
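+
+As a hedged illustration, you can inspect the backlog in the table named above directly. This assumes `psql` access to the Sourcegraph database; the database name and the `exported_at IS NULL` filter are assumptions about the schema, so adjust or drop them as needed.
+
+```bash
+# Count queued telemetry events that have not yet been exported:
+psql -d sourcegraph -c \
+  "SELECT count(*) FROM telemetry_events_export_queue WHERE exported_at IS NULL;"
+```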
-Stream: time to first event (p75)
+#### telemetry: telemetry_v2_event_logs_write_failures
+Failed write V2 events to V1 'event_logs' over 5m
-Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back.
+Telemetry V2 writes also attempt to `tee` events into the legacy V1 events format in the `event_logs` database table for long-term local persistence.
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#telemetry-telemetry_v2_event_logs_write_failures) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100222` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100401` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: time to first event (p50)
+#### telemetry: telemetrygatewayexporter_usermetadata_exporter_total
-Time between calling Stream(), the client connecting to the server etc. and actually getting the first streaming event back.
+(off by default) user metadata exporter operations every 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100223` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100500` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: first byte sent -> received (p99)
+#### telemetry: telemetrygatewayexporter_usermetadata_exporter_99th_percentile_duration
-Time between sending the first byte to the upstream, and then getting the first byte back from the upstream.
+Aggregate successful (off by default) user metadata exporter operation duration distribution over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100230` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100501` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: first byte sent -> received (p95)
+#### telemetry: telemetrygatewayexporter_usermetadata_exporter_errors_total
-Time between sending the first byte to the upstream, and then getting the first byte back from the upstream.
+(off by default) user metadata exporter operation errors every 30m
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#telemetry-telemetrygatewayexporter_usermetadata_exporter_errors_total) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100231` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100502` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
-Stream: first byte sent -> received (p75)
+#### telemetry: telemetrygatewayexporter_usermetadata_exporter_error_rate
-Time between sending the first byte to the upstream, and then getting the first byte back from the upstream.
+(off by default) user metadata exporter operation error rate over 30m
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100232` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/telemetry/telemetry?viewPanel=100503` on your Sourcegraph instance.
+*Managed by the Sourcegraph Services team.*
+The OpenTelemetry collector ingests OpenTelemetry data from Sourcegraph and exports it to the configured backends.
+
+To see this dashboard, visit `/-/debug/grafana/d/otel-collector/otel-collector` on your Sourcegraph instance.
+
+### OpenTelemetry Collector: Receivers
+
+#### otel-collector: otel_span_receive_rate
+
+Spans received per receiver per minute
+
+Shows the rate of spans accepted by the configured receiver.
+
+A Trace is a collection of spans and a span represents a unit of work or operation. Spans are the building blocks of Traces.
+The spans have only been accepted by the receiver, which means they still have to move through the configured pipeline to be exported.
+For more information on tracing and configuration of an OpenTelemetry receiver see https://opentelemetry.io/docs/collector/configuration/#receivers.
-Stream: first byte sent -> received (p50)
+See the Exporters section to see spans that have made it through the pipeline and are exported.
-Time between sending the first byte to the upstream, and then getting the first byte back from the upstream.
+Depending on the configured processors, received spans might be dropped and not exported. For more information on configuring processors see
+https://opentelemetry.io/docs/collector/configuration/#processors.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100233` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100000` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
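+
+For orientation, here is a minimal receiver-to-exporter pipeline sketch. The file path and backend endpoint are assumptions for illustration, not the configuration Sourcegraph ships with.
+
+```bash
+# Write a small OpenTelemetry collector config: spans arrive at the OTLP
+# receiver, are batched by a processor, and leave through an OTLP exporter.
+cat > /etc/otel-collector/config.yaml <<'EOF'
+receivers:
+  otlp:
+    protocols:
+      grpc:
+processors:
+  batch:
+exporters:
+  otlp:
+    endpoint: jaeger:4317   # assumed tracing backend address
+service:
+  pipelines:
+    traces:
+      receivers: [otlp]
+      processors: [batch]
+      exporters: [otlp]
+EOF
+```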
+#### otel-collector: otel_span_refused
+Spans refused per receiver
-Stream: HTTP connect: total (p99)
-Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc.
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#otel-collector-otel_span_refused) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100240` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100001` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
+Spans exported per exporter per minute
+
+Shows the rate of spans being sent by the exporter.
-Stream: HTTP connect: total (p95)
+A Trace is a collection of spans. A Span represents a unit of work or operation. Spans are the building blocks of Traces.
+The rate of spans here indicates spans that have made it through the configured pipeline and have been sent to the configured export destination.
-Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc.
+For more information on configuring an exporter for the OpenTelemetry collector see https://opentelemetry.io/docs/collector/configuration/#exporters.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100241` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100100` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: total (p75)
+#### otel-collector: otel_span_export_failures
+Span export failures by exporter
-Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc.
+Shows the rate of spans that failed to be sent by the configured exporter. A number higher than 0 for a long period can indicate a problem with the exporter configuration or with the service that is being exported to.
-This panel has no related alerts.
+For more information on configuring an exporter for the OpenTelemetry collector see https://opentelemetry.io/docs/collector/configuration/#exporters.
+
+Refer to the [alerts reference](alerts#otel-collector-otel_span_export_failures) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100242` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100101` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: total (p50)
+Exporter queue capacity
-Time spent acquiring an HTTP connection to the upstream, either from an existing pool OR by performing DNS resolution, TCP connection, etc.
+Shows the capacity of the retry queue (in batches).
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100243` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100200` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: dns (p99)
+Exporter queue size
-Portion of time spent on DNS when acquiring an HTTP connection to the upstream.
+Shows the current size of the retry queue.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100250` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100201` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: dns (p95)
+#### otel-collector: otelcol_exporter_enqueue_failed_spans
+Exporter enqueue failed spans
-Portion of time spent on DNS when acquiring an HTTP connection to the upstream.
+Shows the rate of spans that failed to be enqueued by the configured exporter. A number higher than 0 for a long period can indicate a problem with the exporter configuration.
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#otel-collector-otelcol_exporter_enqueue_failed_spans) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100251` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100202` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
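+
+A quick hedged check: the collector serves its own Prometheus metrics on port 8888 by default, so you can confirm enqueue failures directly (adjust the hostname to your deployment).
+
+```bash
+# Scrape the collector's internal metrics endpoint and look for
+# enqueue failures reported by the exporter:
+curl -s http://otel-collector:8888/metrics | grep otelcol_exporter_enqueue_failed_spans
+```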
-Stream: HTTP connect: dns (p75)
+#### otel-collector: otelcol_processor_dropped_spans
-Portion of time spent on DNS when acquiring an HTTP connection to the upstream.
+Spans dropped per processor per minute
-This panel has no related alerts.
+Shows the rate of spans dropped by the configured processor.
+
+Refer to the [alerts reference](alerts#otel-collector-otelcol_processor_dropped_spans) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100252` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100300` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: dns (p50)
+Cpu usage of the collector
-Portion of time spent on DNS when acquiring an HTTP connection to the upstream.
+Shows CPU usage as reported by the OpenTelemetry collector.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100253` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100400` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: tls (p99)
+Memory allocated to the otel collector
-Portion of time spent on TLS when acquiring an HTTP connection to the upstream.
+Shows the allocated memory Resident Set Size (RSS) as reported by the OpenTelemetry collector.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100260` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100401` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
+Memory used by the collector
+
+Shows how much memory is being used by the otel collector.
-Stream: HTTP connect: tls (p95)
+High memory usage might indicate that:
+* The configured pipeline is keeping a lot of spans in memory for processing
+* Spans are failing to be sent and the exporter is configured to retry
+* A high batch count is configured for the batch processor
-Portion of time spent on TLS when acquiring an HTTP connection to the upstream.
+For more information on configuring processors for the OpenTelemetry collector see https://opentelemetry.io/docs/collector/configuration/#processors.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100261` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100402` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
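+
+If the pipeline itself is the suspect, one hedged mitigation is the collector's `memory_limiter` processor. The values below are illustrative; the fragment must be merged into your existing collector configuration, with `memory_limiter` listed first in the pipeline's processors.
+
+```bash
+# Emit a config fragment that caps collector memory; merge it into the
+# `processors:` section of your collector configuration.
+cat > memory-limiter.fragment.yaml <<'EOF'
+processors:
+  memory_limiter:
+    check_interval: 1s
+    limit_mib: 400
+EOF
+```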
+Container missing
-Stream: HTTP connect: tls (p75)
+This value is the number of times a container has not been seen for more than one minute. If you observe this
+value change independent of deployment events (such as an upgrade), it could indicate pods are being OOM killed or terminated for some other reason.
-Portion of time spent on TLS when acquiring an HTTP connection to the upstream.
+- **Kubernetes:**
+  - Determine if the pod was OOM killed using `kubectl describe pod otel-collector` (look for `OOMKilled: true`) and, if so, consider increasing the memory limit in the relevant `Deployment.yaml`.
+  - Check the logs before the container restarted to see if there are `panic:` messages or similar using `kubectl logs -p otel-collector`.
+- **Docker Compose:**
+  - Determine if the container was OOM killed using `docker inspect -f '\{\{json .State\}\}' otel-collector` (look for `"OOMKilled":true`) and, if so, consider increasing the memory limit of the otel-collector container in `docker-compose.yml`.
+  - Check the logs before the container restarted to see if there are `panic:` messages or similar using `docker logs otel-collector` (note this will include logs from the previous and currently running container).
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100262` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100500` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
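+
+The Kubernetes checks above, consolidated into one hedged snippet (in real deployments pod names carry generated suffixes, so adjust the names accordingly):
+
+```bash
+# Look for an OOMKilled termination on the collector pod:
+kubectl describe pod otel-collector | grep -A3 'Last State'
+# Inspect logs from the previous (crashed) container for panics:
+kubectl logs -p otel-collector | grep -m 5 'panic:'
+```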
-Stream: HTTP connect: tls (p50)
+#### otel-collector: container_cpu_usage
-Portion of time spent on TLS when acquiring an HTTP connection to the upstream.
+Container cpu usage total (1m average) across all cores by instance
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#otel-collector-container_cpu_usage) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100263` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100501` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: dial (p99)
+#### otel-collector: container_memory_usage
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream.
+Container memory usage by instance
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#otel-collector-container_memory_usage) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100270` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100502` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: dial (p95)
+Filesystem reads and writes rate by instance over 1h
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream.
+This value indicates the number of filesystem read and write operations by containers of this service.
+When extremely high, this can indicate a resource usage problem, or can cause problems with the service itself, especially if high values or spikes correlate with otel-collector issues.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100271` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100503` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
-Stream: HTTP connect: dial (p75)
+#### otel-collector: pods_available_percentage
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream.
+Percentage pods available
-This panel has no related alerts.
+Refer to the [alerts reference](alerts#otel-collector-pods_available_percentage) for 1 alert related to this panel.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100272` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/otel-collector/otel-collector?viewPanel=100600` on your Sourcegraph instance.
+*Managed by the Sourcegraph Platform team.*
+Cody chat and code completions.
+
+To see this dashboard, visit `/-/debug/grafana/d/completions/completions` on your Sourcegraph instance.
+
+### Completions: Completions requests
+
+#### completions: api_request_rate
-Stream: HTTP connect: dial (p50)
+Rate of completions API requests
-Portion of time spent on golang Dial() when acquiring an HTTP connection to the upstream.
+Rate (QPS) of requests to cody chat and code completion endpoints.
This panel has no related alerts.
-To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100273` on your Sourcegraph instance.
+To see this panel, visit `/-/debug/grafana/d/completions/completions?viewPanel=100000` on your Sourcegraph instance.