gitpod/components/server/src/prometheus-metrics.ts
Milan Pavlik 495ed8e6c3
[server] Set JWT cookie on sign-in WEB-100 (#17200)
* [server] Set JWT cookie on sign-in

* retest

* Fix

* retest

* Fix

* fix

* fix

* Fix

* also clear jwt cookie

* align max age with config

* Fix
2023-04-17 18:35:49 +08:00

248 lines
8.4 KiB
TypeScript

/**
* Copyright (c) 2021 Gitpod GmbH. All rights reserved.
* Licensed under the GNU Affero General Public License (AGPL).
* See License.AGPL.txt in the project root for license information.
*/
import * as prometheusClient from "prom-client";
export function registerServerMetrics(registry: prometheusClient.Registry) {
registry.registerMetric(loginCounter);
registry.registerMetric(apiConnectionCounter);
registry.registerMetric(apiConnectionClosedCounter);
registry.registerMetric(apiCallCounter);
registry.registerMetric(apiCallDurationHistogram);
registry.registerMetric(httpRequestTotal);
registry.registerMetric(httpRequestDuration);
registry.registerMetric(messagebusTopicReads);
registry.registerMetric(gitpodVersionInfo);
registry.registerMetric(instanceStartsSuccessTotal);
registry.registerMetric(instanceStartsFailedTotal);
registry.registerMetric(prebuildsStartedTotal);
registry.registerMetric(stripeClientRequestsCompletedDurationSeconds);
registry.registerMetric(imageBuildsStartedTotal);
registry.registerMetric(imageBuildsCompletedTotal);
registry.registerMetric(centralizedPermissionsValidationsTotal);
registry.registerMetric(spicedbClientLatency);
registry.registerMetric(dashboardErrorBoundary);
registry.registerMetric(jwtCookieIssued);
}
const loginCounter = new prometheusClient.Counter({
name: "gitpod_server_login_requests_total",
help: "Total amount of login requests",
labelNames: ["status", "auth_host"],
});
type LoginCounterStatus =
// The login attempt failed due to a system error (picked up by alerts)
| "failed"
// The login attempt succeeded
| "succeeded"
// The login attempt failed, because the client failed to provide complete session information, for instance.
| "failed_client";
export function increaseLoginCounter(status: LoginCounterStatus, auth_host: string) {
loginCounter.inc({
status,
auth_host,
});
}
const apiConnectionCounter = new prometheusClient.Counter({
name: "gitpod_server_api_connections_total",
help: "Total amount of established API connections",
});
export function increaseApiConnectionCounter() {
apiConnectionCounter.inc();
}
const jwtCookieIssued = new prometheusClient.Counter({
name: "gitpod_server_jwt_cookie_issued_total",
help: "Total number of JWT cookies issued for login sessions",
});
export function reportJWTCookieIssued() {
jwtCookieIssued.inc();
}
const apiConnectionClosedCounter = new prometheusClient.Counter({
name: "gitpod_server_api_connections_closed_total",
help: "Total amount of closed API connections",
});
export function increaseApiConnectionClosedCounter() {
apiConnectionClosedCounter.inc();
}
const apiCallCounter = new prometheusClient.Counter({
name: "gitpod_server_api_calls_total",
help: "Total amount of API calls per method",
labelNames: ["method", "statusCode"],
});
export function increaseApiCallCounter(method: string, statusCode: number) {
apiCallCounter.inc({ method, statusCode });
}
export const apiCallDurationHistogram = new prometheusClient.Histogram({
name: "gitpod_server_api_calls_duration_seconds",
help: "Duration of API calls in seconds",
labelNames: ["method", "statusCode"],
buckets: [0.1, 0.5, 1, 5, 10, 15, 30],
});
export function observeAPICallsDuration(method: string, statusCode: number, duration: number) {
apiCallDurationHistogram.observe({ method, statusCode }, duration);
}
const httpRequestTotal = new prometheusClient.Counter({
name: "gitpod_server_http_requests_total",
help: "Total amount of HTTP requests per express route",
labelNames: ["method", "route", "statusCode"],
});
export function increaseHttpRequestCounter(method: string, route: string, statusCode: number) {
httpRequestTotal.inc({ method, route, statusCode });
}
const httpRequestDuration = new prometheusClient.Histogram({
name: "gitpod_server_http_request_duration_seconds",
help: "Duration of HTTP requests in seconds",
labelNames: ["method", "route", "statusCode"],
buckets: [0.01, 0.05, 0.1, 0.5, 1, 5, 10],
});
export function observeHttpRequestDuration(
method: string,
route: string,
statusCode: number,
durationInSeconds: number,
) {
httpRequestDuration.observe({ method, route, statusCode }, durationInSeconds);
}
const messagebusTopicReads = new prometheusClient.Counter({
name: "gitpod_server_topic_reads_total",
help: "The amount of reads from messagebus topics.",
labelNames: ["topic"],
});
export function increaseMessagebusTopicReads(topic: string) {
messagebusTopicReads.inc({
topic,
});
}
const gitpodVersionInfo = new prometheusClient.Gauge({
name: "gitpod_version_info",
help: "Gitpod's version",
labelNames: ["gitpod_version"],
});
export function setGitpodVersion(gitpod_version: string) {
gitpodVersionInfo.set({ gitpod_version }, 1);
}
const instanceStartsSuccessTotal = new prometheusClient.Counter({
name: "gitpod_server_instance_starts_success_total",
help: "Total amount of successfully performed instance starts",
labelNames: ["retries"],
});
export function increaseSuccessfulInstanceStartCounter(retries: number = 0) {
instanceStartsSuccessTotal.inc({ retries });
}
const instanceStartsFailedTotal = new prometheusClient.Counter({
name: "gitpod_server_instance_starts_failed_total",
help: "Total amount of failed performed instance starts",
labelNames: ["reason"],
});
export type FailedInstanceStartReason =
| "clusterSelectionFailed"
| "startOnClusterFailed"
| "imageBuildFailed"
| "resourceExhausted"
| "other";
export function increaseFailedInstanceStartCounter(reason: FailedInstanceStartReason) {
instanceStartsFailedTotal.inc({ reason });
}
const prebuildsStartedTotal = new prometheusClient.Counter({
name: "gitpod_prebuilds_started_total",
help: "Counter of total prebuilds started.",
});
export function increasePrebuildsStartedCounter() {
prebuildsStartedTotal.inc();
}
export const stripeClientRequestsCompletedDurationSeconds = new prometheusClient.Histogram({
name: "gitpod_server_stripe_client_requests_completed_duration_seconds",
help: "Completed stripe client requests, by outcome and operation",
labelNames: ["operation", "outcome"],
});
export function observeStripeClientRequestsCompleted(operation: string, outcome: string, durationInSeconds: number) {
stripeClientRequestsCompletedDurationSeconds.observe({ operation, outcome }, durationInSeconds);
}
export const imageBuildsStartedTotal = new prometheusClient.Counter({
name: "gitpod_server_image_builds_started_total",
help: "counter of the total number of image builds started on server",
});
export function increaseImageBuildsStartedTotal() {
imageBuildsStartedTotal.inc();
}
export const imageBuildsCompletedTotal = new prometheusClient.Counter({
name: "gitpod_server_image_builds_completed_total",
help: "counter of the total number of image builds recorded as completed on server",
labelNames: ["outcome"],
});
export function increaseImageBuildsCompletedTotal(outcome: "succeeded" | "failed") {
imageBuildsCompletedTotal.inc({ outcome });
}
const centralizedPermissionsValidationsTotal = new prometheusClient.Counter({
name: "gitpod_perms_centralized_validations_total",
help: "counter of centralized permission checks validations against existing system",
labelNames: ["operation", "matches_expectation"],
});
export function reportCentralizedPermsValidation(operation: string, matches: boolean) {
centralizedPermissionsValidationsTotal.inc({ operation, matches_expectation: String(matches) });
}
export const spicedbClientLatency = new prometheusClient.Histogram({
name: "gitpod_spicedb_client_requests_completed_seconds",
help: "Histogram of completed spicedb client requests",
labelNames: ["operation", "permission", "outcome"],
});
export function observespicedbClientLatency(
operation: string,
permission: string,
outcome: Error | undefined,
durationInSeconds: number,
) {
spicedbClientLatency.observe(
{ operation, permission, outcome: outcome === undefined ? "success" : "error" },
durationInSeconds,
);
}
export const dashboardErrorBoundary = new prometheusClient.Counter({
name: "gitpod_dashboard_error_boundary_total",
help: "Total number of errors caught by an error boundary in the dashboard",
});
export function increaseDashboardErrorBoundaryCounter() {
dashboardErrorBoundary.inc();
}