Skip to content

Commit

Permalink
Add monitorType JMX
Browse files Browse the repository at this point in the history
  • Loading branch information
alaturqua committed Sep 17, 2024
1 parent 785844b commit 82cf53d
Show file tree
Hide file tree
Showing 5 changed files with 176 additions and 1 deletion.
19 changes: 19 additions & 0 deletions docs/installation.md
Original file line number Diff line number Diff line change
Expand Up @@ -331,6 +331,25 @@ supported for legacy reasons and may be deprecated in the future. It is only
supported for backend clusters with `web-ui.authentication.type = PASSWORD`. Set
a username and password using `backendState` as with the `JDBC` option.

#### JMX

This pulls cluster information from the `v1/jmx/mbean` endpoint utilizing following
metrics:
- `trino.execution:name=QueryManager`
- `trino.metadata:name=DiscoveryNodeManager`

Configure a username and password by adding `backendState` to your configuration.
The username and password must be valid across all clusters. User requires
`read` rights on `system_information` on all clusters.

```yaml
backendState:
username: "user"
password: "password"
clusterStatsConfiguration:
monitorType: JMX
```

#### NOOP

This option disables health checks.
Original file line number Diff line number Diff line change
@@ -0,0 +1,153 @@
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.gateway.ha.clustermonitor;

import com.fasterxml.jackson.databind.JsonNode;
import com.fasterxml.jackson.databind.ObjectMapper;
import io.airlift.log.Logger;
import io.trino.gateway.ha.config.BackendStateConfiguration;
import io.trino.gateway.ha.config.ProxyBackendConfiguration;
import okhttp3.Call;
import okhttp3.Credentials;
import okhttp3.OkHttpClient;
import okhttp3.Request;
import okhttp3.Response;

import java.io.IOException;

import static io.airlift.http.client.HttpStatus.fromStatusCode;
import static io.trino.gateway.ha.handler.QueryIdCachingProxyHandler.JMX_PATH;

public class ClusterStatsJmxMonitor
implements ClusterStatsMonitor
{
private static final Logger log = Logger.get(ClusterStatsJmxMonitor.class);

private final String username;
private final String password;

public ClusterStatsJmxMonitor(BackendStateConfiguration backendStateConfiguration)
{
this.username = backendStateConfiguration.getUsername();
this.password = backendStateConfiguration.getPassword();
}

@Override
public ClusterStats monitor(ProxyBackendConfiguration backend)
{
log.info("Monitoring cluster stats for backend: %s", backend.getProxyTo());
ClusterStats.Builder clusterStats = ClusterStatsMonitor.getClusterStatsBuilder(backend);

// Fetch DiscoveryNodeManager stats
String discoveryResponse = queryJmx(backend, "trino.metadata:name=DiscoveryNodeManager");
if (discoveryResponse != null) {
processDiscoveryNodeManagerStats(discoveryResponse, clusterStats);
}

// Fetch QueryManager stats
String queryResponse = queryJmx(backend, "trino.execution:name=QueryManager");
if (queryResponse != null) {
processQueryManagerStats(queryResponse, clusterStats);
}

// Set additional fields
clusterStats.proxyTo(backend.getProxyTo())
.externalUrl(backend.getExternalUrl())
.routingGroup(backend.getRoutingGroup());

ClusterStats stats = clusterStats.build();
log.debug("Completed monitoring for backend: %s. Stats: %s", backend.getProxyTo(), stats);
return stats;
}

private void processDiscoveryNodeManagerStats(String response, ClusterStats.Builder clusterStats)
{
try {
JsonNode rootNode = new ObjectMapper().readTree(response);
JsonNode attributes = rootNode.get("attributes");
if (attributes.isArray()) {
for (JsonNode attribute : attributes) {
if ("ActiveNodeCount".equals(attribute.get("name").asText())) {
int activeNodes = attribute.get("value").asInt();
clusterStats.numWorkerNodes(activeNodes)
.healthy(activeNodes - 1 > 0);
log.debug("Processed DiscoveryNodeManager: ActiveNodeCount = %d, Health = %s",
activeNodes, activeNodes - 1 > 0 ? "Healthy" : "Unhealthy");
break;
}
}
}
}
catch (Exception e) {
log.error(e, "Error parsing DiscoveryNodeManager stats");
}
}

private void processQueryManagerStats(String response, ClusterStats.Builder clusterStats)
{
try {
JsonNode rootNode = new ObjectMapper().readTree(response);
JsonNode attributes = rootNode.get("attributes");
if (attributes.isArray()) {
int queuedQueries = 0;
int runningQueries = 0;
for (JsonNode attribute : attributes) {
String name = attribute.get("name").asText();
if ("QueuedQueries".equals(name)) {
queuedQueries = attribute.get("value").asInt();
}
else if ("RunningQueries".equals(name)) {
runningQueries = attribute.get("value").asInt();
}
}
clusterStats.queuedQueryCount(queuedQueries).runningQueryCount(runningQueries);
log.debug("Processed QueryManager: QueuedQueries = %d, RunningQueries = %d",
queuedQueries, runningQueries);
}
}
catch (Exception e) {
log.error(e, "Error parsing QueryManager stats");
}
}

private String queryJmx(ProxyBackendConfiguration backend, String mbeanName)
{
String jmxUrl = backend.getProxyTo() + JMX_PATH + "/" + mbeanName;
log.debug("Querying JMX at URL: %s", jmxUrl);
OkHttpClient client = new OkHttpClient.Builder().build();

Request request = new Request.Builder()
.url(jmxUrl)
.addHeader("Authorization", Credentials.basic(username, password))
.get()
.build();

Call call = client.newCall(request);

try (Response res = call.execute()) {
if (fromStatusCode(res.code()) == io.airlift.http.client.HttpStatus.OK) {
log.debug("Successful JMX response for %s", mbeanName);
return res.body().string();
}
else {
log.error("Failed to fetch JMX data for %s, response code: %d", mbeanName, res.code());
return null;
}
}
catch (IOException e) {
log.error(e, "Error querying JMX for %s", mbeanName);
return null;
}
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -18,5 +18,6 @@ public enum ClusterStatsMonitorType
NOOP,
INFO_API,
UI_API,
JDBC
JDBC,
JMX
}
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,7 @@ public class QueryIdCachingProxyHandler
public static final String OAUTH_PATH = "/oauth2";
public static final String AUTHORIZATION = "Authorization";
public static final String USER_HEADER = "X-Trino-User";
public static final String JMX_PATH = "/v1/jmx/mbean";

private QueryIdCachingProxyHandler() {}
}
Original file line number Diff line number Diff line change
Expand Up @@ -50,6 +50,7 @@ public ClusterStatsMonitor getClusterStatsMonitor(@ForMonitor HttpClient httpCli
case INFO_API -> new ClusterStatsInfoApiMonitor(httpClient, config.getMonitor());
case UI_API -> new ClusterStatsHttpMonitor(config.getBackendState());
case JDBC -> new ClusterStatsJdbcMonitor(config.getBackendState(), config.getMonitor());
case JMX -> new ClusterStatsJmxMonitor(config.getBackendState());
case NOOP -> new NoopClusterStatsMonitor();
};
}
Expand Down

0 comments on commit 82cf53d

Please sign in to comment.