Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
7 changes: 4 additions & 3 deletions .github/workflows/_graph_proxy_container.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -34,8 +34,9 @@ jobs:
with:
images: ${{ env.IMAGE_REPOSITORY }}
tags: |
type=raw,value=${{ steps.tags.outputs.version }}
type=raw,value=latest
type=raw,value=${{ steps.tags.outputs.version }},enable=${{ startsWith(github.ref, 'refs/tags/graph-proxy@') }}
type=raw,value=latest,enable=${{ startsWith(github.ref, 'refs/tags/graph-proxy@') }}
type=raw,value=${{ github.ref_name }}

- name: Set up Docker Buildx
uses: docker/setup-buildx-action@v3.11.1
Expand All @@ -47,7 +48,7 @@ jobs:
context: backend
file: backend/Dockerfile.graph-proxy
target: deploy
push: ${{ github.event_name == 'push' && startsWith(github.ref, 'refs/tags/graph-proxy@') }}
push: ${{ github.event_name == 'push' }}
load: ${{ !(github.event_name == 'push' && startsWith(github.ref, 'refs/tags/graph-proxy@')) }}
tags: ${{ steps.meta.outputs.tags }}
labels: ${{ steps.meta.outputs.labels }}
Expand Down
37 changes: 32 additions & 5 deletions backend/graph-proxy/src/graphql/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -116,7 +116,9 @@ pub async fn graphql_handler(
auth_token_header: Option<TypedHeader<Authorization<Bearer>>>,
request: GraphQLRequest,
) -> GraphQLResponse {
let start = std::time::Instant::now();
let query = request.into_inner();
let mut request_type = "unparseable";

if let Ok(query) = parse_query(&query.query) {
let operation = query.operations;
Expand All @@ -130,19 +132,24 @@ pub async fn graphql_handler(
.map(|operation| operation.1.node.ty)
.collect(),
};
let mut has_mutation = false;
for operation in operations {
match operation {
async_graphql::parser::types::OperationType::Query => state
.metrics_state
.total_requests
.add(1, &[KeyValue::new("request_type", "query")]),
async_graphql::parser::types::OperationType::Mutation => state
.metrics_state
.total_requests
.add(1, &[KeyValue::new("request_type", "mutation")]),
async_graphql::parser::types::OperationType::Mutation => {
has_mutation = true;
state
.metrics_state
.total_requests
.add(1, &[KeyValue::new("request_type", "mutation")])
}
async_graphql::parser::types::OperationType::Subscription => {}
};
}
request_type = if has_mutation { "mutation" } else { "query" };
} else {
state
.metrics_state
Expand All @@ -151,7 +158,27 @@ pub async fn graphql_handler(
};

let auth_token = auth_token_header.map(|header| header.0);
state.schema.execute(query.data(auth_token)).await.into()
let response = state.schema.execute(query.data(auth_token)).await;
let elapsed_ms = start.elapsed().as_secs_f64() * 1000.0;
let status = if response.errors.is_empty() {
"ok"
} else {
"error"
};
if status == "error" {
state
.metrics_state
.total_errors
.add(1, &[KeyValue::new("status", "error")]);
};
state.metrics_state.request_duration_ms.record(
elapsed_ms,
&[
KeyValue::new("request_type", request_type),
KeyValue::new("status", status),
],
);
response.into()
}

lazy_static! {
Expand Down
23 changes: 21 additions & 2 deletions backend/graph-proxy/src/metrics.rs
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
use std::sync::Arc;

use opentelemetry::metrics::{Counter, MeterProvider};
use opentelemetry::metrics::{Counter, Histogram, MeterProvider};
use opentelemetry_sdk::metrics::SdkMeterProvider;

/// Thread-safe wrapper for OTEL metrics
Expand All @@ -11,6 +11,10 @@ pub type MetricsState = Arc<Metrics>;
pub struct Metrics {
/// Total requests on all routes
pub total_requests: Counter<u64>,
/// Request duration in milliseconds, recorded once for every GraphQL request
pub request_duration_ms: Histogram<f64>,
/// Total number of GraphQL responses that contained at least one error
pub total_errors: Counter<u64>,
}

impl Metrics {
Expand All @@ -23,6 +27,21 @@ impl Metrics {
.with_description("The total requests on all routes made since the last restart.")
.build();

Metrics { total_requests }
let request_duration_ms = meter
.f64_histogram("graph_proxy_request_duration_ms")
.with_description("GraphQL request duration")
.with_unit("ms")
.build();

let total_errors = meter
.u64_counter("graph_proxy_total_errors")
.with_description("The total number of errors since the last restart.")
.build();

Metrics {
total_requests,
request_duration_ms,
total_errors,
}
}
}
4 changes: 1 addition & 3 deletions charts/workflows/Chart.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -2,9 +2,7 @@ apiVersion: v2
name: workflows
description: Data Analysis workflow orchestration
type: application

version: 0.13.35

version: 0.13.36
dependencies:
- name: argo-workflows
repository: https://argoproj.github.io/argo-helm
Expand Down
4 changes: 4 additions & 0 deletions charts/workflows/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,10 @@ argo-workflows:
bucket: k8s-workflows-test
region: unsupported
controller:
metricsConfig:
enabled: true
secure: false
scheme: http
replicas: 2
podAnnotations:
prometheus.io/scrape: "true"
Expand Down
Loading