From e61f0596279184782f2a5ffe92eb4988577e06db Mon Sep 17 00:00:00 2001 From: Norbert Kalmar Date: Thu, 18 Apr 2019 19:17:48 +0200 Subject: [PATCH] ZOOKEEPER-3037: Add JVMPauseMonitor https://issues.apache.org/jira/browse/ZOOKEEPER-3037 Author: Norbert Kalmar Reviewers: andor@apache.org Closes #904 from nkalmar/ZOOKEEPER-3037 and squashes the following commits: a6105324b [Norbert Kalmar] ZOOKEEPER-3037 - add serviceStop() and improve unit tests 7d0baaa46 [Norbert Kalmar] ZOOKEEPER-3037 - refactor unit tests 97d2c6103 [Norbert Kalmar] ZOOKEEPER-3037 - cite hadoop-common as source 3661389e4 [Norbert Kalmar] ZOOKEEPER-3037 - Add unit test and various improvements f30975765 [Norbert Kalmar] ZOOKEEPER-3037 - Add JvmPauseMonitor (cherry picked from commit e9adf6ee09ef18258653d65c851fa84c3cd1a51d) Change-Id: I7654fc85168bf163bdbbe96ebf73cb9ccf265e81 --- .../apache/zookeeper/server/ServerConfig.java | 26 +++ .../zookeeper/server/ZooKeeperServer.java | 27 +++ .../zookeeper/server/ZooKeeperServerMain.java | 10 +- .../zookeeper/server/quorum/QuorumPeer.java | 16 ++ .../server/quorum/QuorumPeerConfig.java | 45 +++- .../server/quorum/QuorumPeerMain.java | 5 + .../server/util/JvmPauseMonitor.java | 209 ++++++++++++++++++ .../apache/zookeeper/ServerConfigTest.java | 23 ++ .../server/quorum/QuorumPeerConfigTest.java | 23 ++ .../server/util/JvmPauseMonitorTest.java | 75 +++++++ 10 files changed, 454 insertions(+), 5 deletions(-) create mode 100644 zookeeper-server/src/main/java/org/apache/zookeeper/server/util/JvmPauseMonitor.java create mode 100644 zookeeper-server/src/test/java/org/apache/zookeeper/server/util/JvmPauseMonitorTest.java diff --git a/zookeeper-server/src/main/java/org/apache/zookeeper/server/ServerConfig.java b/zookeeper-server/src/main/java/org/apache/zookeeper/server/ServerConfig.java index dd3f1da9d0c..6b3d1ed4953 100644 --- a/zookeeper-server/src/main/java/org/apache/zookeeper/server/ServerConfig.java +++ b/zookeeper-server/src/main/java/org/apache/zookeeper/server/ServerConfig.java @@ -49,6 +49,15 @@ public class ServerConfig { /** defaults to -1 if not set explicitly */ protected int maxSessionTimeout = -1; + /** JVM Pause Monitor feature switch */ + protected boolean jvmPauseMonitorToRun = false; + /** JVM Pause Monitor warn threshold in ms */ + protected long jvmPauseWarnThresholdMs; + /** JVM Pause Monitor info threshold in ms */ + protected long jvmPauseInfoThresholdMs; + /** JVM Pause Monitor sleep time in ms */ + protected long jvmPauseSleepTimeMs; + /** * Parse arguments for server configuration * @param args clientPort dataDir and optional tickTime and maxClientCnxns @@ -99,6 +108,10 @@ public void readFrom(QuorumPeerConfig config) { maxClientCnxns = config.getMaxClientCnxns(); minSessionTimeout = config.getMinSessionTimeout(); maxSessionTimeout = config.getMaxSessionTimeout(); + jvmPauseMonitorToRun = config.isJvmPauseMonitorToRun(); + jvmPauseInfoThresholdMs = config.getJvmPauseInfoThresholdMs(); + jvmPauseWarnThresholdMs = config.getJvmPauseWarnThresholdMs(); + jvmPauseSleepTimeMs = config.getJvmPauseSleepTimeMs(); } public InetSocketAddress getClientPortAddress() { @@ -115,4 +128,17 @@ public InetSocketAddress getSecureClientPortAddress() { public int getMinSessionTimeout() { return minSessionTimeout; } /** maximum session timeout in milliseconds, -1 if unset */ public int getMaxSessionTimeout() { return maxSessionTimeout; } + + public long getJvmPauseInfoThresholdMs() { + return jvmPauseInfoThresholdMs; + } + public long getJvmPauseWarnThresholdMs() { + return jvmPauseWarnThresholdMs; + } + public long getJvmPauseSleepTimeMs() { + return jvmPauseSleepTimeMs; + } + public boolean isJvmPauseMonitorToRun() { + return jvmPauseMonitorToRun; + } } diff --git a/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServer.java b/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServer.java index 3f3c430775b..c6f6b6ac190 100644 --- a/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServer.java +++ b/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServer.java @@ -70,6 +70,7 @@ import org.apache.zookeeper.server.quorum.QuorumPeerConfig; import org.apache.zookeeper.server.quorum.QuorumPeerConfig; import org.apache.zookeeper.server.quorum.ReadOnlyZooKeeperServer; +import org.apache.zookeeper.server.util.JvmPauseMonitor; import org.apache.zookeeper.txn.CreateSessionTxn; import org.apache.zookeeper.txn.TxnHeader; import org.slf4j.Logger; @@ -109,6 +110,7 @@ public class ZooKeeperServer implements SessionExpirer, ServerStats.Provider { private final AtomicLong hzxid = new AtomicLong(0); public final static Exception ok = new Exception("No prob"); protected RequestProcessor firstProcessor; + protected JvmPauseMonitor jvmPauseMonitor; protected volatile State state = State.INITIAL; protected boolean reconfigEnabled; @@ -187,6 +189,20 @@ public ZooKeeperServer(FileTxnSnapLog txnLogFactory, int tickTime, + " snapdir " + txnLogFactory.getSnapDir()); } + /** + * Adds JvmPauseMonitor and calls + * {@link #ZooKeeperServer(FileTxnSnapLog, int, int, int, ZKDatabase, boolean)} + * + */ + public ZooKeeperServer(JvmPauseMonitor jvmPauseMonitor, FileTxnSnapLog txnLogFactory, int tickTime, + int minSessionTimeout, int maxSessionTimeout, ZKDatabase zkDb, boolean reconfigEnabled) { + this(txnLogFactory, tickTime, minSessionTimeout, maxSessionTimeout, zkDb, reconfigEnabled); + this.jvmPauseMonitor = jvmPauseMonitor; + if(jvmPauseMonitor != null) { + LOG.info("Added JvmPauseMonitor to server"); + } + } + /** * creates a zookeeperserver instance. * @param txnLogFactory the file transaction snapshot logging class @@ -477,10 +493,18 @@ public synchronized void startup() { registerJMX(); + startJvmPauseMonitor(); + setState(State.RUNNING); notifyAll(); } + protected void startJvmPauseMonitor() { + if (this.jvmPauseMonitor != null) { + this.jvmPauseMonitor.serviceStart(); + } + } + protected void setupRequestProcessors() { RequestProcessor finalProcessor = new FinalRequestProcessor(this); RequestProcessor syncProcessor = new SyncRequestProcessor(this, @@ -585,6 +609,9 @@ public synchronized void shutdown(boolean fullyShutDown) { if (firstProcessor != null) { firstProcessor.shutdown(); } + if(jvmPauseMonitor != null) { + jvmPauseMonitor.serviceStop(); + } if (zkDb != null) { if (fullyShutDown) { diff --git a/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServerMain.java b/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServerMain.java index 0cfcf6ddbef..d9d56e564f1 100644 --- a/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServerMain.java +++ b/zookeeper-server/src/main/java/org/apache/zookeeper/server/ZooKeeperServerMain.java @@ -34,6 +34,7 @@ import org.apache.zookeeper.server.persistence.FileTxnSnapLog.DatadirException; import org.apache.zookeeper.server.quorum.QuorumPeerConfig; import org.apache.zookeeper.server.quorum.QuorumPeerConfig.ConfigException; +import org.apache.zookeeper.server.util.JvmPauseMonitor; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -125,8 +126,13 @@ public void runFromConfig(ServerConfig config) // run() in this thread. // create a file logger url from the command line args txnLog = new FileTxnSnapLog(config.dataLogDir, config.dataDir); - final ZooKeeperServer zkServer = new ZooKeeperServer(txnLog, - config.tickTime, config.minSessionTimeout, config.maxSessionTimeout, null, QuorumPeerConfig.isReconfigEnabled()); + JvmPauseMonitor jvmPauseMonitor = null; + if(config.jvmPauseMonitorToRun) { + jvmPauseMonitor = new JvmPauseMonitor(config); + } + final ZooKeeperServer zkServer = new ZooKeeperServer(jvmPauseMonitor, txnLog, + config.tickTime, config.minSessionTimeout, config.maxSessionTimeout, + null, QuorumPeerConfig.isReconfigEnabled()); txnLog.setServerStats(zkServer.serverStats()); // Registers shutdown handler which will be used to know the diff --git a/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeer.java b/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeer.java index 5c52b698432..418b1a2ac27 100644 --- a/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeer.java +++ b/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeer.java @@ -72,6 +72,7 @@ import org.apache.zookeeper.server.quorum.QuorumPeerConfig.ConfigException; import org.apache.zookeeper.server.quorum.flexible.QuorumMaj; import org.apache.zookeeper.server.quorum.flexible.QuorumVerifier; +import org.apache.zookeeper.server.util.JvmPauseMonitor; import org.apache.zookeeper.server.util.ZxidUtils; import org.slf4j.Logger; import org.slf4j.LoggerFactory; @@ -127,6 +128,7 @@ public class QuorumPeer extends ZooKeeperThread implements QuorumStats.Provider */ private ZKDatabase zkDb; + private JvmPauseMonitor jvmPauseMonitor; public static final class AddressTuple { public final InetSocketAddress quorumAddr; public final InetSocketAddress electionAddr; @@ -468,6 +470,10 @@ public int getQuorumSize(){ return getVotingView().size(); } + public void setJvmPauseMonitor(JvmPauseMonitor jvmPauseMonitor) { + this.jvmPauseMonitor = jvmPauseMonitor; + } + /** * QuorumVerifier implementation; default (majority). */ @@ -914,6 +920,7 @@ public synchronized void start() { System.out.println(e); } startLeaderElection(); + startJvmPauseMonitor(); super.start(); } @@ -992,6 +999,12 @@ synchronized public void startLeaderElection() { this.electionAlg = createElectionAlgorithm(electionType); } + private void startJvmPauseMonitor() { + if (this.jvmPauseMonitor != null) { + this.jvmPauseMonitor.serviceStart(); + } + } + /** * Count the number of nodes in the map that could be followers. * @param peers @@ -1351,6 +1364,9 @@ public void shutdown() { if(udpSocket != null) { udpSocket.close(); } + if(jvmPauseMonitor != null) { + jvmPauseMonitor.serviceStop(); + } try { adminServer.shutdown(); diff --git a/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerConfig.java b/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerConfig.java index dc5aec28937..56daffc0d47 100644 --- a/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerConfig.java +++ b/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerConfig.java @@ -39,6 +39,7 @@ import org.apache.yetus.audience.InterfaceAudience; import org.apache.zookeeper.common.ClientX509Util; import org.apache.zookeeper.common.StringUtils; +import org.apache.zookeeper.server.util.JvmPauseMonitor; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import org.slf4j.MDC; @@ -114,6 +115,23 @@ public class QuorumPeerConfig { */ private final int MIN_SNAP_RETAIN_COUNT = 3; + /** + * JVM Pause Monitor feature switch + */ + protected boolean jvmPauseMonitorToRun = false; + /** + * JVM Pause Monitor warn threshold in ms + */ + protected long jvmPauseWarnThresholdMs = JvmPauseMonitor.WARN_THRESHOLD_DEFAULT; + /** + * JVM Pause Monitor info threshold in ms + */ + protected long jvmPauseInfoThresholdMs = JvmPauseMonitor.INFO_THRESHOLD_DEFAULT; + /** + * JVM Pause Monitor sleep time in ms + */ + protected long jvmPauseSleepTimeMs = JvmPauseMonitor.SLEEP_TIME_MS_DEFAULT; + @SuppressWarnings("serial") public static class ConfigException extends Exception { public ConfigException(String msg) { @@ -328,6 +346,14 @@ public void parseProperties(Properties zkProp) quorumServicePrincipal = value; } else if (key.equals("quorum.cnxn.threads.size")) { quorumCnxnThreadsSize = Integer.parseInt(value); + } else if (key.equals(JvmPauseMonitor.INFO_THRESHOLD_KEY)) { + jvmPauseInfoThresholdMs = Long.parseLong(value); + } else if (key.equals(JvmPauseMonitor.WARN_THRESHOLD_KEY)) { + jvmPauseWarnThresholdMs = Long.parseLong(value); + } else if (key.equals(JvmPauseMonitor.SLEEP_TIME_MS_KEY)) { + jvmPauseSleepTimeMs = Long.parseLong(value); + } else if (key.equals(JvmPauseMonitor.JVM_PAUSE_MONITOR_FEATURE_SWITCH_KEY)) { + jvmPauseMonitorToRun = Boolean.parseBoolean(value); } else { System.setProperty("zookeeper." + key, value); } @@ -412,7 +438,7 @@ public void parseProperties(Properties zkProp) if (minSessionTimeout > maxSessionTimeout) { throw new IllegalArgumentException( "minSessionTimeout must not be larger than maxSessionTimeout"); - } + } // backward compatibility - dynamic configuration in the same file as // static configuration params see writeDynamicConfig() @@ -658,14 +684,14 @@ public static QuorumVerifier parseDynamicConfig(Properties dynamicConfigProp, in /* * If using FLE, then every server requires a separate election * port. - */ + */ if (eAlg != 0) { for (QuorumServer s : qv.getVotingMembers().values()) { if (s.electionAddr == null) throw new IllegalArgumentException( "Missing election port for server: " + s.id); } - } + } } return qv; } @@ -786,6 +812,19 @@ public Map getServers() { return Collections.unmodifiableMap(quorumVerifier.getAllMembers()); } + public long getJvmPauseInfoThresholdMs() { + return jvmPauseInfoThresholdMs; + } + public long getJvmPauseWarnThresholdMs() { + return jvmPauseWarnThresholdMs; + } + public long getJvmPauseSleepTimeMs() { + return jvmPauseSleepTimeMs; + } + public boolean isJvmPauseMonitorToRun() { + return jvmPauseMonitorToRun; + } + public long getServerId() { return serverId; } public boolean isDistributed() { diff --git a/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerMain.java b/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerMain.java index b90e9f44773..fe73c5461d4 100644 --- a/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerMain.java +++ b/zookeeper-server/src/main/java/org/apache/zookeeper/server/quorum/QuorumPeerMain.java @@ -23,6 +23,7 @@ import javax.security.sasl.SaslException; import org.apache.yetus.audience.InterfaceAudience; +import org.apache.zookeeper.server.util.JvmPauseMonitor; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import org.apache.zookeeper.jmx.ManagedUtil; @@ -204,6 +205,10 @@ public void runFromConfig(QuorumPeerConfig config) quorumPeer.setQuorumCnxnThreadsSize(config.quorumCnxnThreadsSize); quorumPeer.initialize(); + if(config.jvmPauseMonitorToRun) { + quorumPeer.setJvmPauseMonitor(new JvmPauseMonitor(config)); + } + quorumPeer.start(); quorumPeer.join(); } catch (InterruptedException e) { diff --git a/zookeeper-server/src/main/java/org/apache/zookeeper/server/util/JvmPauseMonitor.java b/zookeeper-server/src/main/java/org/apache/zookeeper/server/util/JvmPauseMonitor.java new file mode 100644 index 00000000000..0ce617fe8e8 --- /dev/null +++ b/zookeeper-server/src/main/java/org/apache/zookeeper/server/util/JvmPauseMonitor.java @@ -0,0 +1,209 @@ +/** + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.zookeeper.server.util; + +import org.apache.zookeeper.server.ServerConfig; +import org.apache.zookeeper.server.quorum.QuorumPeerConfig; +import org.slf4j.Logger; +import org.slf4j.LoggerFactory; + +import java.lang.management.GarbageCollectorMXBean; +import java.lang.management.ManagementFactory; +import java.time.Instant; +import java.util.ArrayList; +import java.util.HashSet; +import java.util.HashMap; +import java.util.Map; +import java.util.Set; +import java.util.List; + +/** + * This code is originally from hadoop-common, see: + * https://github.com/apache/hadoop/blob/trunk/hadoop-common-project/hadoop-common/src/main/java/org/apache/hadoop/util/JvmPauseMonitor.java + * + * Class which sets up a simple thread which runs in a loop sleeping + * for a short interval of time. If the sleep takes significantly longer + * than its target time, it implies that the JVM or host machine has + * paused processing, which may cause other problems. If such a pause is + * detected, the thread logs a message. + */ +public class JvmPauseMonitor { + private static final Logger LOG = LoggerFactory.getLogger(JvmPauseMonitor.class); + + public static final String JVM_PAUSE_MONITOR_FEATURE_SWITCH_KEY = "jvm.pause.monitor"; + + /** The target sleep time */ + protected long sleepTimeMs; + public static final String SLEEP_TIME_MS_KEY = "jvm.pause.sleep.time.ms"; + public static final long SLEEP_TIME_MS_DEFAULT = 500; + + /** log WARN if we detect a pause longer than this threshold */ + protected long warnThresholdMs; + public static final String WARN_THRESHOLD_KEY = "jvm.pause.warn-threshold.ms"; + public static final long WARN_THRESHOLD_DEFAULT = 10000; + + /** log INFO if we detect a pause longer than this threshold */ + protected long infoThresholdMs; + public static final String INFO_THRESHOLD_KEY = "jvm.pause.info-threshold.ms"; + public static final long INFO_THRESHOLD_DEFAULT = 1000; + + private long numGcWarnThresholdExceeded = 0; + private long numGcInfoThresholdExceeded = 0; + private long totalGcExtraSleepTime = 0; + + private Thread monitorThread; + private volatile boolean shouldRun = true; + + public JvmPauseMonitor(QuorumPeerConfig config) { + this.warnThresholdMs = config.getJvmPauseWarnThresholdMs(); + this.infoThresholdMs = config.getJvmPauseInfoThresholdMs(); + this.sleepTimeMs = config.getJvmPauseSleepTimeMs(); + } + + public JvmPauseMonitor(ServerConfig config) { + this.warnThresholdMs = config.getJvmPauseWarnThresholdMs(); + this.infoThresholdMs = config.getJvmPauseInfoThresholdMs(); + this.sleepTimeMs = config.getJvmPauseSleepTimeMs(); + } + + public void serviceStart() { + monitorThread = new Thread(new JVMMonitor()); + monitorThread.setDaemon(true); + monitorThread.start(); + } + + public void serviceStop() { + shouldRun = false; + if (monitorThread != null) { + monitorThread.interrupt(); + try { + monitorThread.join(); + } catch (InterruptedException e) { + Thread.currentThread().interrupt(); + } + } + } + + public boolean isStarted() { + return monitorThread != null; + } + + public long getNumGcWarnThresholdExceeded() { + return numGcWarnThresholdExceeded; + } + + public long getNumGcInfoThresholdExceeded() { + return numGcInfoThresholdExceeded; + } + + public long getTotalGcExtraSleepTime() { + return totalGcExtraSleepTime; + } + + private String formatMessage(long extraSleepTime, + Map gcTimesAfterSleep, + Map gcTimesBeforeSleep) { + + Set gcBeanNames = new HashSet<>(gcTimesAfterSleep.keySet()); + gcBeanNames.retainAll(gcTimesBeforeSleep.keySet()); + List gcDiffs = new ArrayList<>(); + + for (String name : gcBeanNames) { + GcTimes diff = gcTimesAfterSleep.get(name).subtract(gcTimesBeforeSleep.get(name)); + if (diff.gcCount != 0) { + gcDiffs.add("GC pool '" + name + "' had collection(s): " + diff.toString()); + } + } + + String ret = String.format("Detected pause in JVM or host machine (eg GC): pause of approximately %d ms, " + + "total pause: info level: %d, warn level: %d %n", + extraSleepTime, numGcInfoThresholdExceeded, numGcWarnThresholdExceeded); + if (gcDiffs.isEmpty()) { + ret += ("No GCs detected"); + } else { + ret += String.join("\n", gcDiffs); + } + return ret; + } + + private Map getGcTimes() { + Map map = new HashMap<>(); + List gcBeans = ManagementFactory.getGarbageCollectorMXBeans(); + for (GarbageCollectorMXBean gcBean : gcBeans) { + map.put(gcBean.getName(), new GcTimes(gcBean)); + } + return map; + } + + private static class GcTimes { + + private long gcCount; + private long gcTimeMillis; + + private GcTimes(GarbageCollectorMXBean gcBean) { + gcCount = gcBean.getCollectionCount(); + gcTimeMillis = gcBean.getCollectionTime(); + } + + private GcTimes(long count, long time) { + this.gcCount = count; + this.gcTimeMillis = time; + } + + private GcTimes subtract(GcTimes other) { + return new GcTimes(this.gcCount - other.gcCount, + this.gcTimeMillis - other.gcTimeMillis); + } + + public String toString() { + return "count=" + gcCount + " time=" + gcTimeMillis + "ms"; + } + + } + + private class JVMMonitor implements Runnable { + @Override + public void run() { + Map gcTimesBeforeSleep = getGcTimes(); + LOG.info("Starting JVM Pause Monitor with infoThresholdMs:{} warnThresholdMs:{} and sleepTimeMs:{}", + infoThresholdMs, warnThresholdMs, sleepTimeMs); + while (shouldRun) { + long startTime = Instant.now().toEpochMilli(); + try { + Thread.sleep(sleepTimeMs); + } catch (InterruptedException ie) { + return; + } + long endTime = Instant.now().toEpochMilli(); + long extraSleepTime = (endTime - startTime) - sleepTimeMs; + Map gcTimesAfterSleep = getGcTimes(); + + if (extraSleepTime > warnThresholdMs) { + ++numGcWarnThresholdExceeded; + LOG.warn(formatMessage(extraSleepTime, gcTimesAfterSleep, gcTimesBeforeSleep)); + } else if (extraSleepTime > infoThresholdMs) { + ++numGcInfoThresholdExceeded; + LOG.info(formatMessage(extraSleepTime, gcTimesAfterSleep, gcTimesBeforeSleep)); + } + totalGcExtraSleepTime += extraSleepTime; + gcTimesBeforeSleep = gcTimesAfterSleep; + } + } + } +} \ No newline at end of file diff --git a/zookeeper-server/src/test/java/org/apache/zookeeper/ServerConfigTest.java b/zookeeper-server/src/test/java/org/apache/zookeeper/ServerConfigTest.java index 27faa745b6f..e542670481a 100644 --- a/zookeeper-server/src/test/java/org/apache/zookeeper/ServerConfigTest.java +++ b/zookeeper-server/src/test/java/org/apache/zookeeper/ServerConfigTest.java @@ -19,12 +19,15 @@ package org.apache.zookeeper; import org.apache.zookeeper.server.ServerConfig; +import org.apache.zookeeper.server.quorum.QuorumPeerConfig; import org.junit.Before; import org.junit.Test; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNotNull; import static org.junit.Assert.assertTrue; +import static org.mockito.Mockito.mock; +import static org.mockito.Mockito.when; import java.io.File; @@ -60,6 +63,26 @@ public void testTooManyArguments() { serverConfig.parse(args); } + @Test + public void testJvmPauseMonitorConfigured() { + final Long sleepTime = 444L; + final Long warnTH = 5555L; + final Long infoTH = 555L; + + QuorumPeerConfig qpConfig = mock(QuorumPeerConfig.class); + when(qpConfig.isJvmPauseMonitorToRun()).thenReturn(true); + when(qpConfig.getJvmPauseSleepTimeMs()).thenReturn(sleepTime); + when(qpConfig.getJvmPauseWarnThresholdMs()).thenReturn(warnTH); + when(qpConfig.getJvmPauseInfoThresholdMs()).thenReturn(infoTH); + + serverConfig.readFrom(qpConfig); + + assertEquals(sleepTime, Long.valueOf(serverConfig.getJvmPauseSleepTimeMs())); + assertEquals(warnTH, Long.valueOf(serverConfig.getJvmPauseWarnThresholdMs())); + assertEquals(infoTH, Long.valueOf(serverConfig.getJvmPauseInfoThresholdMs())); + assertTrue(serverConfig.isJvmPauseMonitorToRun()); + } + boolean checkEquality(String a, String b) { assertNotNull(a); assertNotNull(b); diff --git a/zookeeper-server/src/test/java/org/apache/zookeeper/server/quorum/QuorumPeerConfigTest.java b/zookeeper-server/src/test/java/org/apache/zookeeper/server/quorum/QuorumPeerConfigTest.java index 5dfd2d05611..d56a61882d1 100644 --- a/zookeeper-server/src/test/java/org/apache/zookeeper/server/quorum/QuorumPeerConfigTest.java +++ b/zookeeper-server/src/test/java/org/apache/zookeeper/server/quorum/QuorumPeerConfigTest.java @@ -20,6 +20,7 @@ import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNotNull; +import static org.junit.Assert.assertTrue; import static org.junit.Assert.fail; import java.io.File; @@ -115,6 +116,28 @@ public void testSamePortConfiguredForClientAndElection() throws IOException, Con quorumPeerConfig.parseProperties(zkProp); } + @Test + public void testJvmPauseMonitorConfigured() + throws IOException, ConfigException { + final Long sleepTime = 444L; + final Long warnTH = 5555L; + final Long infoTH = 555L; + + QuorumPeerConfig quorumPeerConfig = new QuorumPeerConfig(); + Properties zkProp = getDefaultZKProperties(); + zkProp.setProperty("dataDir", new File("myDataDir").getAbsolutePath()); + zkProp.setProperty("jvm.pause.monitor", "true"); + zkProp.setProperty("jvm.pause.sleep.time.ms", sleepTime.toString()); + zkProp.setProperty("jvm.pause.warn-threshold.ms", warnTH.toString()); + zkProp.setProperty("jvm.pause.info-threshold.ms", infoTH.toString()); + quorumPeerConfig.parseProperties(zkProp); + + assertEquals(sleepTime, Long.valueOf(quorumPeerConfig.getJvmPauseSleepTimeMs())); + assertEquals(warnTH, Long.valueOf(quorumPeerConfig.getJvmPauseWarnThresholdMs())); + assertEquals(infoTH, Long.valueOf(quorumPeerConfig.getJvmPauseInfoThresholdMs())); + assertTrue(quorumPeerConfig.isJvmPauseMonitorToRun()); + } + private Properties getDefaultZKProperties() { Properties zkProp = new Properties(); zkProp.setProperty("dataDir", new File("myDataDir").getAbsolutePath()); diff --git a/zookeeper-server/src/test/java/org/apache/zookeeper/server/util/JvmPauseMonitorTest.java b/zookeeper-server/src/test/java/org/apache/zookeeper/server/util/JvmPauseMonitorTest.java new file mode 100644 index 00000000000..4e701b83d07 --- /dev/null +++ b/zookeeper-server/src/test/java/org/apache/zookeeper/server/util/JvmPauseMonitorTest.java @@ -0,0 +1,75 @@ +/** + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + +package org.apache.zookeeper.server.util; + +import org.apache.zookeeper.server.quorum.QuorumPeerConfig; +import org.junit.After; +import org.junit.Assert; +import org.junit.Test; + +import static org.mockito.Mockito.mock; +import static org.mockito.Mockito.when; + +public class JvmPauseMonitorTest { + + private final Long sleepTime = 100L; + private final Long infoTH = -1L; + private final Long warnTH = -1L; + private JvmPauseMonitor pauseMonitor; + + @Test(timeout=5000) + public void testJvmPauseMonitorExceedInfoThreshold() throws InterruptedException { + QuorumPeerConfig qpConfig = mock(QuorumPeerConfig.class); + when(qpConfig.getJvmPauseSleepTimeMs()).thenReturn(sleepTime); + when(qpConfig.getJvmPauseInfoThresholdMs()).thenReturn(infoTH); + + pauseMonitor = new JvmPauseMonitor(qpConfig); + pauseMonitor.serviceStart(); + + Assert.assertEquals(sleepTime, Long.valueOf(pauseMonitor.sleepTimeMs)); + Assert.assertEquals(infoTH, Long.valueOf(pauseMonitor.infoThresholdMs)); + + while(pauseMonitor.getNumGcInfoThresholdExceeded() == 0) { + Thread.sleep(200); + } + } + + @Test(timeout=5000) + public void testJvmPauseMonitorExceedWarnThreshold() throws InterruptedException { + QuorumPeerConfig qpConfig = mock(QuorumPeerConfig.class); + when(qpConfig.getJvmPauseSleepTimeMs()).thenReturn(sleepTime); + when(qpConfig.getJvmPauseWarnThresholdMs()).thenReturn(warnTH); + + pauseMonitor = new JvmPauseMonitor(qpConfig); + pauseMonitor.serviceStart(); + + Assert.assertEquals(sleepTime, Long.valueOf(pauseMonitor.sleepTimeMs)); + Assert.assertEquals(warnTH, Long.valueOf(pauseMonitor.warnThresholdMs)); + + while(pauseMonitor.getNumGcWarnThresholdExceeded() == 0) { + Thread.sleep(200); + } + + } + + @After + public void teardown() { + pauseMonitor.serviceStop(); + } +}