# Prometheus recording rules for the "slo-onprem-rpc" SLO, derived from the
# rpc_server_duration histogram (series: rpc_server_duration_count and
# rpc_server_duration_bucket).
groups:
  # Request-count increases over several windows, split by error code.
  - interval: 2m30s
    name: slo-onprem-rpc-increase
    rules:
      - expr: sum by (cluster, rpc_connect_rpc_error_code, rpc_method, rpc_service) (increase(rpc_server_duration_count[1h]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:increase1h
      - expr: sum by (cluster, rpc_connect_rpc_error_code, rpc_method, rpc_service) (increase(rpc_server_duration_count[12h]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:increase12h
      - expr: sum by (cluster, rpc_connect_rpc_error_code, rpc_method, rpc_service) (increase(rpc_server_duration_count[1d]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:increase1d
      - expr: sum by (cluster, rpc_connect_rpc_error_code, rpc_method, rpc_service) (increase(rpc_server_duration_count[1w]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:increase1w
      - expr: sum by (cluster, rpc_connect_rpc_error_code, rpc_method, rpc_service) (increase(rpc_server_duration_count[4w]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:increase4w

  # Error ratio (requests with a server-side error code / all requests) per
  # window. The numerator selects the _count series: histogram buckets are
  # cumulative, so selecting _bucket without an `le` matcher would count each
  # failed request once per bucket it falls under and inflate the ratio.
  - interval: 30s
    name: slo-onprem-rpc
    rules:
      - expr: >-
          sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count{rpc_connect_rpc_error_code=~"internal|unavailable|data_loss|unknown"}[5m]))
          / sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count[5m]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:burnrate5m
      - expr: >-
          sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count{rpc_connect_rpc_error_code=~"internal|unavailable|data_loss|unknown"}[1h]))
          / sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count[1h]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:burnrate1h
      - expr: >-
          sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count{rpc_connect_rpc_error_code=~"internal|unavailable|data_loss|unknown"}[2h]))
          / sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count[2h]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:burnrate2h
      - expr: >-
          sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count{rpc_connect_rpc_error_code=~"internal|unavailable|data_loss|unknown"}[1d]))
          / sum by (cluster, rpc_method, rpc_service) (rate(rpc_server_duration_count[1d]))
        labels:
          slo: slo-onprem-rpc
        record: rpc_server_duration:burnrate1d

  # Count of requests that exceeded a latency threshold, computed as
  # (le="+Inf" bucket) - (le=<threshold> bucket), plus latency percentiles.
  # The services listed in the regex are held to the le="250000" threshold
  # ("slow" rules); every other service is held to le="15000" ("fast" rules).
  # NOTE(review): the unit of the `le` bounds is not visible here - confirm.
  - interval: 1m0s
    name: slo-onprem-rpc-latency-increase
    rules:
      # "slow" services: requests above the 250000 bucket bound.
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1h]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="250000",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1h]))
        labels:
          latency: "250000"
        record: rpc_server_duration_bucket:slow1h
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[12h]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="250000",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[12h]))
        labels:
          latency: "250000"
        record: rpc_server_duration_bucket:slow12h
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1d]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="250000",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1d]))
        labels:
          latency: "250000"
        record: rpc_server_duration_bucket:slow1d
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1w]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="250000",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1w]))
        labels:
          latency: "250000"
        record: rpc_server_duration_bucket:slow1w
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[4w]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="250000",rpc_service=~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[4w]))
        labels:
          latency: "250000"
        record: rpc_server_duration_bucket:slow4w

      # All remaining services: requests above the 15000 bucket bound.
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1h]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="15000",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1h]))
        labels:
          latency: "15000"
        record: rpc_server_duration_bucket:fast1h
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[12h]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="15000",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[12h]))
        labels:
          latency: "15000"
        record: rpc_server_duration_bucket:fast12h
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1d]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="15000",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1d]))
        labels:
          latency: "15000"
        record: rpc_server_duration_bucket:fast1d
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1w]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="15000",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[1w]))
        labels:
          latency: "15000"
        record: rpc_server_duration_bucket:fast1w
      - expr: >-
          sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="+Inf",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[4w]))
          - sum by (cluster, rpc_service, rpc_method) (increase(rpc_server_duration_bucket{le="15000",rpc_service!~"buf.alpha.registry.v1alpha1.CodeGenerationService|buf.alpha.javacompile.v1alpha1.CompileService|buf.alpha.registry.v1alpha1.GenerateService|buf.alpha.sandbox.v1alpha1.SandboxService"}[4w]))
        labels:
          latency: "15000"
        record: rpc_server_duration_bucket:fast4w

      # Latency percentiles over a 4m rate window. All three rules share one
      # record name and are told apart by the `percentile` label.
      - expr: (histogram_quantile(0.99, sum by (cluster, rpc_service, rpc_method, le) (rate(rpc_server_duration_bucket[4m]))))
        labels:
          percentile: p99
        record: rpc_server_duration_bucket:histogram_quantile
      - expr: (histogram_quantile(0.95, sum by (cluster, rpc_service, rpc_method, le) (rate(rpc_server_duration_bucket[4m]))))
        labels:
          percentile: p95
        record: rpc_server_duration_bucket:histogram_quantile
      - expr: (histogram_quantile(0.5, sum by (cluster, rpc_service, rpc_method, le) (rate(rpc_server_duration_bucket[4m]))))
        labels:
          percentile: p50
        record: rpc_server_duration_bucket:histogram_quantile