Skip to content

Commit

Permalink
crc32 checksum of healthy (#105)
Browse files Browse the repository at this point in the history
  • Loading branch information
wlx5575 authored Aug 4, 2023
1 parent 5ecd284 commit 3bfe3e5
Show file tree
Hide file tree
Showing 6 changed files with 176 additions and 6 deletions.
1 change: 1 addition & 0 deletions src/main/java/com/jd/jdbc/common/util/CollectionUtils.java
Original file line number Diff line number Diff line change
Expand Up @@ -47,4 +47,5 @@ public static boolean isNotEmpty(Map<?, ?> map) {
/**
 * Tells whether the given array holds at least one element.
 *
 * @param array the array to inspect; may be {@code null}
 * @return {@code true} when {@code array} is non-null and its length is greater than zero
 */
public static boolean isNotEmpty(Object[] array) {
    if (array == null) {
        return false;
    }
    return array.length != 0;
}

}
38 changes: 38 additions & 0 deletions src/main/java/com/jd/jdbc/common/util/Crc32Utill.java
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
/*
Copyright 2021 JD Project Authors.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/

package com.jd.jdbc.common.util;

import java.util.zip.CRC32;

/**
 * Static helpers that compute CRC-32 checksums with {@link java.util.zip.CRC32}.
 */
public class Crc32Utill {

    /** Not instantiable: every member is static. */
    private Crc32Utill() {
    }

    /**
     * Computes the CRC-32 checksum of a whole byte array.
     *
     * @param b the bytes to digest; must not be {@code null}
     * @return the CRC-32 value as reported by {@link CRC32#getValue()}
     * @throws NullPointerException if {@code b} is {@code null}
     */
    public static long checksumByCrc32(byte[] b) {
        final CRC32 digest = new CRC32();
        digest.update(b, 0, b.length);
        return digest.getValue();
    }

    /**
     * Computes the CRC-32 checksum of a single byte.
     *
     * <p>This delegates to {@link CRC32#update(int)}, which the JDK documents as using only
     * the low eight bits of its argument; the upper 24 bits of {@code b} do not affect the result.
     *
     * @param b the byte to digest, passed as an int
     * @return the CRC-32 value as reported by {@link CRC32#getValue()}
     */
    public static long checksumByCrc32(int b) {
        final CRC32 digest = new CRC32();
        digest.update(b);
        return digest.getValue();
    }

}
3 changes: 2 additions & 1 deletion src/main/java/com/jd/jdbc/discovery/HealthCheck.java
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,7 @@
import java.util.Objects;
import java.util.Timer;
import java.util.TimerTask;
import java.util.TreeMap;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.CopyOnWriteArrayList;
import java.util.concurrent.atomic.AtomicInteger;
Expand Down Expand Up @@ -131,7 +132,7 @@ public Map<String, TabletHealthCheck> getHealthByAliasCopy() {
}

/**
 * Returns a snapshot of the {@code healthy} map whose entries iterate in sorted key order.
 *
 * <p>A {@link TreeMap} is used so that callers iterating the snapshot see the keys in their
 * natural {@code String} order rather than in hash order.
 *
 * <p>The copy is shallow: only the key-to-list mappings are copied, so each value is the
 * same {@code List} instance that {@code healthy} holds. Callers must not reorder or
 * modify those lists.
 *
 * @return a new, independently modifiable map containing the current mappings of {@code healthy}
 */
public Map<String, List<TabletHealthCheck>> getHealthyCopy() {
    return new TreeMap<>(healthy);
}

public IQueryService tabletConnection(Topodata.TabletAlias alias) {
Expand Down
61 changes: 59 additions & 2 deletions src/main/java/com/jd/jdbc/monitor/HealthyCollector.java
Original file line number Diff line number Diff line change
Expand Up @@ -16,11 +16,14 @@

package com.jd.jdbc.monitor;

import com.google.common.collect.Lists;
import com.jd.jdbc.common.util.Crc32Utill;
import com.jd.jdbc.discovery.HealthCheck;
import com.jd.jdbc.discovery.TabletHealthCheck;
import io.prometheus.client.Collector;
import io.prometheus.client.GaugeMetricFamily;
import java.util.Collections;
import java.util.ArrayList;
import java.util.Comparator;
import java.util.List;
import java.util.Map;

Expand All @@ -31,6 +34,12 @@ public final class HealthyCollector extends Collector {

private static final HealthyCollector HEALTH_CHECK_COLLECTOR = new HealthyCollector();

// Label names handed to the checksum GaugeMetricFamily: a single label called "HealthyChecksum".
private static final List<String> LABEL_NAME_HEALTHY = Lists.newArrayList("HealthyChecksum");

// Metric name of the checksum gauge family.
private static final String COLLECT_NAME_HEALTHY = "HealthyChecksum";

// Help text attached to the checksum gauge family.
private static final String COLLECT_HELP_HEALTHY = "crc32 checksum of the current healthCheck.healthy state ";

// Private so that instances are created only inside this class (see HEALTH_CHECK_COLLECTOR).
private HealthyCollector() {
}

Expand All @@ -55,6 +64,54 @@ public List<MetricFamilySamples> collect() {
HealthCheckCollector.buildGaugeMetric(labeledGauge, notServing, tabletHealthCheck);
}
}
return Collections.singletonList(labeledGauge);

GaugeMetricFamily labeledGaugeCheckSum = collectChecksum(healthyCopy);

List<MetricFamilySamples> ret = new ArrayList<>();
ret.add(labeledGauge);
ret.add(labeledGaugeCheckSum);
return ret;
}

/**
 * Builds the gauge family that publishes the CRC32 checksum of the given healthy map.
 *
 * <p>The family carries exactly one sample. The checksum is used twice: rendered as a
 * decimal string for the single label value, and as the numeric sample value.
 *
 * @param healthy the healthy map to digest with {@link #stateHealthyChecksum(Map)}
 * @return a gauge family named by {@code COLLECT_NAME_HEALTHY} holding one sample
 */
public GaugeMetricFamily collectChecksum(Map<String, List<TabletHealthCheck>> healthy) {
    final GaugeMetricFamily checksumFamily =
        new GaugeMetricFamily(COLLECT_NAME_HEALTHY, COLLECT_HELP_HEALTHY, LABEL_NAME_HEALTHY);

    final long checksum = stateHealthyChecksum(healthy);
    checksumFamily.addMetric(Lists.newArrayList(Long.toString(checksum)), checksum);
    return checksumFamily;
}

/**
 * Computes a CRC32 checksum describing the serving tablets in the given healthy map.
 *
 * <p>Lists are visited in the iteration order of {@code healthy.values()}. Within each list
 * the tablets are ordered by alias uid before being digested, so two lists holding the same
 * tablets in a different order yield the same checksum. Entries whose serving flag is
 * {@code false} are skipped.
 *
 * <p>The lists passed in are never modified. They may be shared with the owner of the map
 * (copying a map copies only its mappings, not its value lists), so sorting them in place
 * would silently reorder the owner's data.
 *
 * <p>The text is encoded as UTF-8 so that the checksum does not depend on the JVM's
 * default charset.
 *
 * @param healthy map whose value lists are digested; must not be {@code null}
 * @return the CRC32 value of the digested text
 */
public static long stateHealthyChecksum(Map<String, List<TabletHealthCheck>> healthy) {
    StringBuilder sb = new StringBuilder();

    for (List<TabletHealthCheck> tabletHealthCheckList : healthy.values()) {
        // Sort a private copy so the caller's (possibly shared) list keeps its own ordering.
        List<TabletHealthCheck> sortedByUid = new ArrayList<>(tabletHealthCheckList);
        sortedByUid.sort(new Comparator<TabletHealthCheck>() {
            @Override
            public int compare(TabletHealthCheck o1, TabletHealthCheck o2) {
                return Long.compare(o1.getTablet().getAlias().getUid(), o2.getTablet().getAlias().getUid());
            }
        });

        for (TabletHealthCheck tabletHealthCheck : sortedByUid) {
            if (!tabletHealthCheck.getServing().get()) {
                // Non-serving tablets do not contribute to the checksum.
                continue;
            }
            sb.append(tabletHealthCheck.getTarget().getCell());
            sb.append(tabletHealthCheck.getTarget().getKeyspace());
            sb.append(tabletHealthCheck.getTarget().getShard());
            sb.append(tabletHealthCheck.getTarget().getTabletType());
            sb.append("\n");
            sb.append(tabletHealthCheck.getTablet().getAlias());
            sb.append(tabletHealthCheck.getTablet().getHostname());
            sb.append(tabletHealthCheck.getTablet().getMysqlPort());
            sb.append("\n");
            sb.append(tabletHealthCheck.getMasterTermStartTime());
            sb.append("\n");
        }
    }
    // Explicit charset: getBytes() without one uses the platform default, which can differ per host.
    return Crc32Utill.checksumByCrc32(sb.toString().getBytes(java.nio.charset.StandardCharsets.UTF_8));
}

}
13 changes: 10 additions & 3 deletions src/main/java/com/jd/jdbc/srvtopo/ResilientServer.java
Original file line number Diff line number Diff line change
Expand Up @@ -19,13 +19,13 @@
package com.jd.jdbc.srvtopo;

import com.google.common.util.concurrent.ThreadFactoryBuilder;
import com.jd.jdbc.common.util.Crc32Utill;
import com.jd.jdbc.context.IContext;
import com.jd.jdbc.context.VtContext;
import com.jd.jdbc.key.CurrentShard;
import com.jd.jdbc.monitor.SrvKeyspaceCollector;
import com.jd.jdbc.sqlparser.support.logging.Log;
import com.jd.jdbc.sqlparser.support.logging.LogFactory;
import com.jd.jdbc.sqlparser.utils.Utils;
import com.jd.jdbc.topo.Topo;
import com.jd.jdbc.topo.TopoException;
import com.jd.jdbc.topo.TopoExceptionCode;
Expand Down Expand Up @@ -93,12 +93,19 @@ public class ResilientServer implements SrvTopoServer {
public List<SrvKeyspaceCollector.Info> getSrvKeyspaceCollectorInfo() {
List<SrvKeyspaceCollector.Info> infoList = new ArrayList<>();
Map<String, SrvKeyspaceEntry> map = new HashMap<>(srvKeyspaceCache);

for (Map.Entry<String, SrvKeyspaceEntry> entry : map.entrySet()) {
String keyspaceCell = entry.getKey();
String[] split = keyspaceCell.split("\\.");
Topodata.SrvKeyspace srvKeyspace = entry.getValue().value;
String md5 = srvKeyspace == null ? "" : Utils.md5(srvKeyspace.toString());
SrvKeyspaceCollector.Info info = new SrvKeyspaceCollector.Info(md5, split[0], split[1]);
long infoCrc32;

if (srvKeyspace == null) {
infoCrc32 = 0;
} else {
infoCrc32 = Crc32Utill.checksumByCrc32(srvKeyspace.toString().getBytes());
}
SrvKeyspaceCollector.Info info = new SrvKeyspaceCollector.Info(Long.toString(infoCrc32), split[0], split[1]);
infoList.add(info);
}
return infoList;
Expand Down
66 changes: 66 additions & 0 deletions src/test/java/com/jd/jdbc/discovery/HealthCheckTest.java
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,7 @@
import com.jd.jdbc.context.IContext;
import com.jd.jdbc.context.VtContext;
import com.jd.jdbc.discovery.TabletHealthCheck.TabletStreamHealthStatus;
import com.jd.jdbc.monitor.HealthyCollector;
import com.jd.jdbc.queryservice.CombinedQueryService;
import com.jd.jdbc.queryservice.IParentQueryService;
import com.jd.jdbc.queryservice.MockQueryServer;
Expand All @@ -40,6 +41,7 @@
import io.vitess.proto.Query;
import io.vitess.proto.Topodata;
import java.io.IOException;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
Expand Down Expand Up @@ -839,6 +841,70 @@ public void testMysqlPort3358to0() throws IOException, InterruptedException {
printOk();
}

/**
 * The checksum must not depend on the order of the tablets inside a healthy list:
 * two maps holding the same two serving tablets under the same key, in opposite
 * list order, must produce equal checksums.
 */
@Test
public void testHealthyListChecksum() {
    HealthCheck healthCheck = getHealthCheck();
    Topodata.Tablet replicaSeven = buildTablet("cella", 7, "1.1.1.7", "k", "s", portMap, Topodata.TabletType.REPLICA);
    Topodata.Tablet replicaEight = buildTablet("cella", 8, "1.1.1.8", "k", "s", portMap, Topodata.TabletType.REPLICA);
    Query.Target sharedTarget = Query.Target.newBuilder()
        .setKeyspace(replicaSeven.getKeyspace())
        .setShard(replicaSeven.getShard())
        .setTabletType(replicaSeven.getType())
        .build();

    // First state: tablets listed as uid 7, then uid 8.
    Map<String, List<TabletHealthCheck>> ascendingState = healthCheck.getHealthyCopy();
    List<TabletHealthCheck> ascending = new ArrayList<>();

    TabletHealthCheck checkSeven = new TabletHealthCheck(null, replicaSeven, sharedTarget);
    checkSeven.getServing().set(true);
    TabletHealthCheck checkEight = new TabletHealthCheck(null, replicaEight, sharedTarget);
    checkEight.getServing().set(true);

    ascending.add(checkSeven);
    ascending.add(checkEight);
    ascendingState.put("k1", ascending);

    // Second state: the same tablets listed as uid 8, then uid 7.
    Map<String, List<TabletHealthCheck>> descendingState = healthCheck.getHealthyCopy();
    List<TabletHealthCheck> descending = new ArrayList<>();
    descending.add(checkEight);
    descending.add(checkSeven);
    descendingState.put("k1", descending);

    long ascendingCrc32 = HealthyCollector.stateHealthyChecksum(ascendingState);
    long descendingCrc32 = HealthyCollector.stateHealthyChecksum(descendingState);
    Assert.assertEquals("Wrong HealthyChecksum", ascendingCrc32, descendingCrc32);
}

/**
 * Checks that the healthy checksum stays the same when the two replicas swap the last
 * value passed to sendOnNextMessage (presumably the seconds-behind-master lag, judging
 * by the test name; confirm against sendOnNextMessage).
 */
@Test
public void testHealthyChecksumSetBehindMaster() throws IOException, InterruptedException {
HealthCheck hc = getHealthCheck();
// add tablet
String keyInHealthy = "k.s.replica";
MockTablet mockTablet1 = buildMockTablet("cella", 7, "1.1.1.7", "k", "s", portMap, Topodata.TabletType.REPLICA);
MockTablet mockTablet2 = buildMockTablet("cella", 8, "1.1.1.8", "k", "s", portMap, Topodata.TabletType.REPLICA);

hc.addTablet(mockTablet1.getTablet());
hc.addTablet(mockTablet2.getTablet());
// Fixed waits around the message sends; presumably they let the health check process them asynchronously.
Thread.sleep(200);
// First round: tablet1 is sent 1 and tablet2 is sent 2 as the last argument.
sendOnNextMessage(mockTablet1, Topodata.TabletType.REPLICA, true, 0, 0.5, 1);
sendOnNextMessage(mockTablet2, Topodata.TabletType.REPLICA, true, 0, 0.5, 2);
Thread.sleep(200);

// sort list in healthy order by secondsBehindMaster
hc.recomputeHealthyLocked(keyInHealthy);
long firstCrc32 = HealthyCollector.stateHealthyChecksum(hc.getHealthyCopy());

// Second round: the two values are swapped between the tablets.
sendOnNextMessage(mockTablet1, Topodata.TabletType.REPLICA, true, 0, 0.5, 2);
sendOnNextMessage(mockTablet2, Topodata.TabletType.REPLICA, true, 0, 0.5, 1);
Thread.sleep(200);

// sort list in healthy order by secondsBehindMaster
hc.recomputeHealthyLocked(keyInHealthy);
long secondCrc32 = HealthyCollector.stateHealthyChecksum(hc.getHealthyCopy());

// Sanity check: the first two entries under the key report different hostnames.
Assert.assertNotEquals(hc.getHealthyCopy().get(keyInHealthy).get(0).getTablet().getHostname(), hc.getHealthyCopy().get(keyInHealthy).get(1).getTablet().getHostname());
// The checksum taken after the swap must equal the one taken before it.
Assert.assertEquals("Wrong HealthyChecksum", firstCrc32, secondCrc32);

closeQueryService(mockTablet1, mockTablet2);
}

private void startWatchTopo(String keyspaceName, TopoServer topoServer, String... cells) {
for (String cell : cells) {
TopologyWatcherManager.INSTANCE.startWatch(globalContext, topoServer, cell, keyspaceName);
Expand Down

0 comments on commit 3bfe3e5

Please sign in to comment.