本文主要研究一下nacos的HttpHealthCheckProcessorjava
nacos-1.1.3/naming/src/main/java/com/alibaba/nacos/naming/healthcheck/HealthCheckProcessor.javagit
public interface HealthCheckProcessor { /** * Run check task for service * * @param task check task */ void process(HealthCheckTask task); /** * Get check task type, refer to enum HealthCheckType * * @return check type */ String getType(); }
nacos-1.1.3/naming/src/main/java/com/alibaba/nacos/naming/healthcheck/HttpHealthCheckProcessor.javagithub
@Component public class HttpHealthCheckProcessor implements HealthCheckProcessor { @Autowired private SwitchDomain switchDomain; @Autowired private HealthCheckCommon healthCheckCommon; private static AsyncHttpClient asyncHttpClient; private static final int CONNECT_TIMEOUT_MS = 500; static { try { AsyncHttpClientConfig.Builder builder = new AsyncHttpClientConfig.Builder(); builder.setMaximumConnectionsTotal(-1); builder.setMaximumConnectionsPerHost(-1); builder.setAllowPoolingConnection(false); builder.setFollowRedirects(false); builder.setIdleConnectionTimeoutInMs(CONNECT_TIMEOUT_MS); builder.setConnectionTimeoutInMs(CONNECT_TIMEOUT_MS); builder.setCompressionEnabled(false); builder.setIOThreadMultiplier(1); builder.setMaxRequestRetry(0); builder.setUserAgent("VIPServer"); asyncHttpClient = new AsyncHttpClient(builder.build()); } catch (Throwable e) { SRV_LOG.error("[HEALTH-CHECK] Error while constructing HTTP asynchronous client", e); } } @Override public String getType() { return "HTTP"; } @Override public void process(HealthCheckTask task) { List<Instance> ips = task.getCluster().allIPs(false); if (CollectionUtils.isEmpty(ips)) { return; } if (!switchDomain.isHealthCheckEnabled()) { return; } Cluster cluster = task.getCluster(); for (Instance ip : ips) { try { if (ip.isMarked()) { if (SRV_LOG.isDebugEnabled()) { SRV_LOG.debug("http check, ip is marked as to skip health check, ip: {}" + ip.getIp()); } continue; } if (!ip.markChecking()) { SRV_LOG.warn("http check started before last one finished, service: {}:{}:{}", task.getCluster().getService().getName(), task.getCluster().getName(), ip.getIp()); healthCheckCommon.reEvaluateCheckRT(task.getCheckRTNormalized() * 2, task, switchDomain.getHttpHealthParams()); continue; } AbstractHealthChecker.Http healthChecker = (AbstractHealthChecker.Http) cluster.getHealthChecker(); int ckPort = cluster.isUseIPPort4Check() ? ip.getPort() : cluster.getDefCkport(); URL host = new URL("http://" + ip.getIp() + ":" + ckPort); URL target = new URL(host, healthChecker.getPath()); AsyncHttpClient.BoundRequestBuilder builder = asyncHttpClient.prepareGet(target.toString()); Map<String, String> customHeaders = healthChecker.getCustomHeaders(); for (Map.Entry<String, String> entry : customHeaders.entrySet()) { if ("Host".equals(entry.getKey())) { builder.setVirtualHost(entry.getValue()); continue; } builder.setHeader(entry.getKey(), entry.getValue()); } builder.execute(new HttpHealthCheckCallback(ip, task)); MetricsMonitor.getHttpHealthCheckMonitor().incrementAndGet(); } catch (Throwable e) { ip.setCheckRT(switchDomain.getHttpHealthParams().getMax()); healthCheckCommon.checkFail(ip, task, "http:error:" + e.getMessage()); healthCheckCommon.reEvaluateCheckRT(switchDomain.getHttpHealthParams().getMax(), task, switchDomain.getHttpHealthParams()); } } } //...... }
nacos-1.1.3/naming/src/main/java/com/alibaba/nacos/naming/healthcheck/HttpHealthCheckProcessor.javaasync
private class HttpHealthCheckCallback extends AsyncCompletionHandler<Integer> { private Instance ip; private HealthCheckTask task; private long startTime = System.currentTimeMillis(); public HttpHealthCheckCallback(Instance ip, HealthCheckTask task) { this.ip = ip; this.task = task; } @Override public Integer onCompleted(Response response) throws Exception { ip.setCheckRT(System.currentTimeMillis() - startTime); int httpCode = response.getStatusCode(); if (HttpURLConnection.HTTP_OK == httpCode) { healthCheckCommon.checkOK(ip, task, "http:" + httpCode); healthCheckCommon.reEvaluateCheckRT(System.currentTimeMillis() - startTime, task, switchDomain.getHttpHealthParams()); } else if (HttpURLConnection.HTTP_UNAVAILABLE == httpCode || HttpURLConnection.HTTP_MOVED_TEMP == httpCode) { // server is busy, need verification later healthCheckCommon.checkFail(ip, task, "http:" + httpCode); healthCheckCommon.reEvaluateCheckRT(task.getCheckRTNormalized() * 2, task, switchDomain.getHttpHealthParams()); } else { //probably means the state files has been removed by administrator healthCheckCommon.checkFailNow(ip, task, "http:" + httpCode); healthCheckCommon.reEvaluateCheckRT(switchDomain.getHttpHealthParams().getMax(), task, switchDomain.getHttpHealthParams()); } return httpCode; } @Override public void onThrowable(Throwable t) { ip.setCheckRT(System.currentTimeMillis() - startTime); Throwable cause = t; int maxStackDepth = 50; for (int deepth = 0; deepth < maxStackDepth && cause != null; deepth++) { if (cause instanceof SocketTimeoutException || cause instanceof ConnectTimeoutException || cause instanceof org.jboss.netty.channel.ConnectTimeoutException || cause instanceof TimeoutException || cause.getCause() instanceof TimeoutException) { healthCheckCommon.checkFail(ip, task, "http:timeout:" + cause.getMessage()); healthCheckCommon.reEvaluateCheckRT(task.getCheckRTNormalized() * 2, task, switchDomain.getHttpHealthParams()); return; } cause = cause.getCause(); } // connection error, probably not reachable if (t instanceof ConnectException) { healthCheckCommon.checkFailNow(ip, task, "http:unable2connect:" + t.getMessage()); healthCheckCommon.reEvaluateCheckRT(switchDomain.getHttpHealthParams().getMax(), task, switchDomain.getHttpHealthParams()); } else { healthCheckCommon.checkFail(ip, task, "http:error:" + t.getMessage()); healthCheckCommon.reEvaluateCheckRT(switchDomain.getHttpHealthParams().getMax(), task, switchDomain.getHttpHealthParams()); } } }
HttpHealthCheckProcessor實現了HealthCheckProcessor接口,其static方法初始化了AsyncHttpClient;其getType返回的是HTTP;其process方法會遍歷instances,而後對於非marked及markChecking的執行health check,並註冊HttpHealthCheckCallback;對於非markChecking的或者出現異常的則執行healthCheckCommon.reEvaluateCheckRTide